1 /* Copyright (C) 2011-2022 Free Software Foundation, Inc.
2    This file is part of the GNU C Library.
3 
4    The GNU C Library is free software; you can redistribute it and/or
5    modify it under the terms of the GNU Lesser General Public
6    License as published by the Free Software Foundation; either
7    version 2.1 of the License, or (at your option) any later version.
8 
9    The GNU C Library is distributed in the hope that it will be useful,
10    but WITHOUT ANY WARRANTY; without even the implied warranty of
11    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
12    Lesser General Public License for more details.
13 
14    You should have received a copy of the GNU Lesser General Public
15    License along with the GNU C Library; if not, see
16    <https://www.gnu.org/licenses/>.  */
17 
18 #include <assert.h>
19 #include <dlfcn.h>
20 #include <errno.h>
21 #include <gconv.h>
22 #include <uchar.h>
23 #include <wcsmbsload.h>
24 
25 #include <sysdep.h>
26 
27 #ifndef EILSEQ
28 # define EILSEQ EINVAL
29 #endif
30 
31 
32 /* This is the private state used if PS is NULL.  */
33 static mbstate_t state;
34 
35 size_t
mbrtoc16(char16_t * pc16,const char * s,size_t n,mbstate_t * ps)36 mbrtoc16 (char16_t *pc16, const char *s, size_t n, mbstate_t *ps)
37 {
38   if (ps == NULL)
39     ps = &state;
40 
41   /* The standard text does not say that S being NULL means the state
42      is reset even if the second half of a surrogate still have to be
43      returned.  In fact, the error code description indicates
44      otherwise.  Therefore always first try to return a second
45      half.  */
46   if (ps->__count & 0x80000000)
47     {
48       /* We have to return the second word for a surrogate.  */
49       ps->__count &= 0x7fffffff;
50       *pc16 = ps->__value.__wch;
51       ps->__value.__wch = L'\0';
52       return (size_t) -3;
53     }
54 
55   wchar_t wc;
56   struct __gconv_step_data data;
57   int status;
58   size_t result;
59   size_t dummy;
60   const unsigned char *inbuf, *endbuf;
61   unsigned char *outbuf = (unsigned char *) &wc;
62   const struct gconv_fcts *fcts;
63 
64   /* Set information for this step.  */
65   data.__invocation_counter = 0;
66   data.__internal_use = 1;
67   data.__flags = __GCONV_IS_LAST;
68   data.__statep = ps;
69 
70   /* A first special case is if S is NULL.  This means put PS in the
71      initial state.  */
72   if (s == NULL)
73     {
74       pc16 = NULL;
75       s = "";
76       n = 1;
77     }
78 
79   if (n == 0)
80     return (size_t) -2;
81 
82   /* Tell where we want the result.  */
83   data.__outbuf = outbuf;
84   data.__outbufend = outbuf + sizeof (wchar_t);
85 
86   /* Get the conversion functions.  */
87   fcts = get_gconv_fcts (_NL_CURRENT_DATA (LC_CTYPE));
88 
89   /* Do a normal conversion.  */
90   inbuf = (const unsigned char *) s;
91   endbuf = inbuf + n;
92   if (__glibc_unlikely (endbuf < inbuf))
93     {
94       endbuf = (const unsigned char *) ~(uintptr_t) 0;
95       if (endbuf == inbuf)
96 	goto ilseq;
97     }
98   __gconv_fct fct = fcts->towc->__fct;
99 #ifdef PTR_DEMANGLE
100   if (fcts->towc->__shlib_handle != NULL)
101     PTR_DEMANGLE (fct);
102 #endif
103 
104   status = DL_CALL_FCT (fct, (fcts->towc, &data, &inbuf, endbuf,
105 			      NULL, &dummy, 0, 1));
106 
107   /* There must not be any problems with the conversion but illegal input
108      characters.  The output buffer must be large enough, otherwise the
109      definition of MB_CUR_MAX is not correct.  All the other possible
110      errors also must not happen.  */
111   assert (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
112 	  || status == __GCONV_ILLEGAL_INPUT
113 	  || status == __GCONV_INCOMPLETE_INPUT
114 	  || status == __GCONV_FULL_OUTPUT);
115 
116   if (status == __GCONV_OK || status == __GCONV_EMPTY_INPUT
117       || status == __GCONV_FULL_OUTPUT)
118     {
119       result = inbuf - (const unsigned char *) s;
120 
121       if (wc < 0x10000)
122 	{
123 	  if (pc16 != NULL)
124 	    *pc16 = wc;
125 
126 	  if (data.__outbuf != outbuf && wc == L'\0')
127 	    {
128 	      /* The converted character is the NUL character.  */
129 	      assert (__mbsinit (data.__statep));
130 	      result = 0;
131 	    }
132 	}
133       else
134 	{
135 	  /* This is a surrogate.  */
136 	  if (pc16 != NULL)
137 	    *pc16 = 0xd7c0 + (wc >> 10);
138 
139 	  ps->__count |= 0x80000000;
140 	  ps->__value.__wch = 0xdc00 + (wc & 0x3ff);
141 	}
142     }
143   else if (status == __GCONV_INCOMPLETE_INPUT)
144     result = (size_t) -2;
145   else
146     {
147     ilseq:
148       result = (size_t) -1;
149       __set_errno (EILSEQ);
150     }
151 
152   return result;
153 }
154