1 /* Conversion from and to IBM932.
2    Copyright (C) 2000-2022 Free Software Foundation, Inc.
3    This file is part of the GNU C Library.
4 
5    The GNU C Library is free software; you can redistribute it and/or
6    modify it under the terms of the GNU Lesser General Public
7    License as published by the Free Software Foundation; either
8    version 2.1 of the License, or (at your option) any later version.
9 
10    The GNU C Library is distributed in the hope that it will be useful,
11    but WITHOUT ANY WARRANTY; without even the implied warranty of
12    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13    Lesser General Public License for more details.
14 
15    You should have received a copy of the GNU Lesser General Public
16    License along with the GNU C Library; if not, see
17    <https://www.gnu.org/licenses/>.  */
18 
19 #include <dlfcn.h>
20 #include <stdint.h>
21 #include <stdbool.h>
22 #include "ibm932.h"
23 
24 #define FROM	0
25 #define TO	1
26 
27 /* Definitions used in the body of the `gconv' function.  */
28 #define CHARSET_NAME	"IBM932//"
29 #define FROM_LOOP	from_ibm932
30 #define TO_LOOP		to_ibm932
31 #define ONE_DIRECTION	0
32 
33 /* Definitions of initialization and destructor function.  */
34 #define DEFINE_INIT	1
35 #define DEFINE_FINI	1
36 
37 #define MIN_NEEDED_FROM	1
38 #define MAX_NEEDED_FROM	2
39 #define MIN_NEEDED_TO	4
40 
41 /* First, define the conversion function from IBM-932 to UCS4.  */
42 #define MIN_NEEDED_INPUT	MIN_NEEDED_FROM
43 #define MAX_NEEDED_INPUT	MAX_NEEDED_FROM
44 #define MIN_NEEDED_OUTPUT	MIN_NEEDED_TO
45 #define LOOPFCT			FROM_LOOP
46 #define BODY \
47   {									      \
48     const struct gap *rp2 = __ibm932db_to_ucs4_idx;			      \
49     uint32_t ch = *inptr;						      \
50     uint32_t res;							      \
51 									      \
52     if (__builtin_expect (ch == 0x80, 0)				      \
53 	|| __builtin_expect (ch == 0xa0, 0)				      \
54 	|| __builtin_expect (ch == 0xfd, 0)				      \
55 	|| __builtin_expect (ch == 0xfe, 0)				      \
56 	|| __builtin_expect (ch == 0xff, 0))				      \
57       {									      \
58 	/* This is an illegal character.  */				      \
59 	STANDARD_FROM_LOOP_ERR_HANDLER (1);				      \
60       }									      \
61 									      \
62     /* Use the IBM932 table for single byte.  */			      \
63     res = __ibm932sb_to_ucs4[ch];					      \
64     if (__builtin_expect (res == 0, 0) && ch != 0)			      \
65       {									      \
66 	/* Use the IBM932 table for double byte.  */			      \
67 	if (__glibc_unlikely (inptr + 1 >= inend))			      \
68 	  {								      \
69 	    /* The second character is not available.			      \
70 	       Store the intermediate result.  */			      \
71 	    result = __GCONV_INCOMPLETE_INPUT;				      \
72 	    break;							      \
73 	  }								      \
74 									      \
75 	ch = (ch * 0x100) + inptr[1];					      \
76 	/* ch was less than 0xfd.  */					      \
77 	assert (ch < 0xfd00);						      \
78 	while (ch > rp2->end)						      \
79 	  ++rp2;							      \
80 									      \
81 	if (__builtin_expect (ch < rp2->start, 0)			      \
82 	    || (res = __ibm932db_to_ucs4[ch + rp2->idx],		      \
83 	    __builtin_expect (res, '\1') == 0 && ch !=0))		      \
84 	  {								      \
85 	    /* This is an illegal character.  */			      \
86 	    STANDARD_FROM_LOOP_ERR_HANDLER (2);				      \
87 	  }								      \
88 	else								      \
89 	  {								      \
90 	    put32 (outptr, res);					      \
91 	    outptr += 4;						      \
92 	    inptr += 2;							      \
93 	  }								      \
94       }									      \
95     else								      \
96       {									      \
97 	if (res == 0xa5)						      \
98 	  res = 0x5c;							      \
99 	else if (res == 0x203e)						      \
100 	  res = 0x7e;							      \
101 	put32 (outptr, res);						      \
102 	outptr += 4;							      \
103 	inptr++;							      \
104       }									      \
105   }
106 #define LOOP_NEED_FLAGS
107 #define ONEBYTE_BODY \
108   {									      \
109     if (c == 0x80 || c == 0xa0 || c >= 0xfd)				      \
110       return WEOF;							      \
111     uint32_t res = __ibm932sb_to_ucs4[c];				      \
112     if (res == 0 && c != 0)						      \
113       return WEOF;							      \
114     if (res == 0xa5)						              \
115       res = 0x5c;							      \
116     else if (res == 0x203e)						      \
117       res = 0x7e;							      \
118     return res;								      \
119   }
120 #include <iconv/loop.c>
121 
122 /* Next, define the other direction.  */
123 #define MIN_NEEDED_INPUT	MIN_NEEDED_TO
124 #define MIN_NEEDED_OUTPUT	MIN_NEEDED_FROM
125 #define MAX_NEEDED_OUTPUT	MAX_NEEDED_FROM
126 #define LOOPFCT			TO_LOOP
127 #define BODY \
128   {									      \
129     const struct gap *rp = __ucs4_to_ibm932sb_idx;			      \
130     unsigned char sc;							      \
131     uint32_t ch = get32 (inptr);					      \
132     bool found = true;							      \
133     uint32_t i;								      \
134     uint32_t low;							      \
135     uint32_t high;							      \
136     uint16_t pccode;							      \
137 									      \
138     if (__glibc_unlikely (ch >= 0xffff))				      \
139       {									      \
140 	UNICODE_TAG_HANDLER (ch, 4);					      \
141 	rp = NULL;							      \
142       }									      \
143     else								      \
144       while (ch > rp->end)						      \
145 	++rp;								      \
146 									      \
147     /* Use the UCS4 table for single byte.  */				      \
148     if (__builtin_expect (rp == NULL, 0)				      \
149 	|| __builtin_expect (ch < rp->start, 0)				      \
150 	|| (sc = __ucs4_to_ibm932sb[ch + rp->idx],			      \
151 	__builtin_expect (sc, '\1') == '\0' && ch != L'\0'))		      \
152       {									      \
153 									      \
154 	/* Use the UCS4 table for double byte.  */			      \
155 	found = false;							      \
156 	low = 0;							      \
157 	high = (sizeof (__ucs4_to_ibm932db) >> 1)			      \
158 		/ sizeof (__ucs4_to_ibm932db[0][FROM]);			      \
159 	pccode = ch;							      \
160 	if (__glibc_likely (rp != NULL))				      \
161 	  while (low < high)						      \
162 	    {								      \
163 	      i = (low + high) >> 1;					      \
164 	      if (pccode < __ucs4_to_ibm932db[i][FROM])			      \
165 		high = i;						      \
166 	      else if (pccode > __ucs4_to_ibm932db[i][FROM])		      \
167 		low = i + 1;						      \
168 	      else 							      \
169 		{							      \
170 		  pccode = __ucs4_to_ibm932db[i][TO];			      \
171 		  found = true;						      \
172 		  break;						      \
173 		}							      \
174 	    }								      \
175 	if (found) 							      \
176 	  {								      \
177 	    if (__glibc_unlikely (outptr + 2 > outend))			      \
178 	      {								      \
179 		result = __GCONV_FULL_OUTPUT;				      \
180 		break;							      \
181 	      }								      \
182 	    *outptr++ = pccode >> 8 & 0xff;				      \
183 	    *outptr++ = pccode & 0xff;					      \
184 	  }								      \
185 	else								      \
186 	  {								      \
187 	    /* This is an illegal character.  */			      \
188 	    STANDARD_TO_LOOP_ERR_HANDLER (4);				      \
189 	  }								      \
190       }									      \
191     else								      \
192       {									      \
193 	if (__glibc_unlikely (outptr + 1 > outend))			      \
194 	  {								      \
195 	    result = __GCONV_FULL_OUTPUT;				      \
196 	    break;							      \
197 	  }								      \
198 	if (ch == 0x5c)							      \
199 	  *outptr++ = 0x5c;						      \
200 	else if (ch == 0x7e)						      \
201 	  *outptr++ = 0x7e;						      \
202 	else								      \
203 	  *outptr++ = sc;						      \
204       }									      \
205 									      \
206     /* Now that we wrote the output increment the input pointer.  */	      \
207     inptr += 4;								      \
208   }
209 #define LOOP_NEED_FLAGS
210 #include <iconv/loop.c>
211 
212 /* Now define the toplevel functions.  */
213 #include <iconv/skeleton.c>
214