xref: /illumos-gate/usr/src/lib/libc/port/locale/iswctype.c (revision b6805bf78d2bbbeeaea8909a05623587b42d58b3)
1 /*
2  * Copyright 2010 Nexenta Systems, Inc.  All rights reserved.
3  * Copyright (c) 1989, 1993
4  *	The Regents of the University of California.  All rights reserved.
5  * (c) UNIX System Laboratories, Inc.
6  * All or some portions of this file are derived from material licensed
7  * to the University of California by American Telephone and Telegraph
8  * Co. or Unix System Laboratories, Inc. and are reproduced herein with
9  * the permission of UNIX System Laboratories, Inc.
10  *
11  * This code is derived from software contributed to Berkeley by
12  * Paul Borman at Krystal Technologies.
13  *
14  * Redistribution and use in source and binary forms, with or without
15  * modification, are permitted provided that the following conditions
16  * are met:
17  * 1. Redistributions of source code must retain the above copyright
18  *    notice, this list of conditions and the following disclaimer.
19  * 2. Redistributions in binary form must reproduce the above copyright
20  *    notice, this list of conditions and the following disclaimer in the
21  *    documentation and/or other materials provided with the distribution.
22  * 4. Neither the name of the University nor the names of its contributors
23  *    may be used to endorse or promote products derived from this software
24  *    without specific prior written permission.
25  *
26  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
27  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
28  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
29  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
30  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
31  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
32  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
33  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
35  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
36  * SUCH DAMAGE.
37  */
38 
39 #include "lint.h"
40 #include <wctype.h>
41 #include "runefile.h"
42 #include "runetype.h"
43 #include "_ctype.h"
44 
/*
 * We removed: iswascii, iswhexnumber, and iswnumber, as
 * these are not present on Solaris.  Note that the standard requires
 * iswascii to be a macro, so it is defined in our headers.
 *
 * We renamed (per Solaris) iswideogram, iswphonogram, and iswspecial to
 * the equivalent names without "w".  We added a new isnumber, that looks
 * for non-ASCII numbers.
 */
54 
55 static int
56 __istype(wint_t c, unsigned int f)
57 {
58 	unsigned int rt;
59 
60 	/* Fast path for single byte locales */
61 	if (c < 0 || c >= _CACHED_RUNES)
62 		rt =  ___runetype(c);
63 	else
64 		rt = _CurrentRuneLocale->__runetype[c];
65 	return (rt & f);
66 }
67 
68 static int
69 __isctype(wint_t c, unsigned int f)
70 {
71 	unsigned int rt;
72 
73 	/* Fast path for single byte locales */
74 	if (c < 0 || c >= _CACHED_RUNES)
75 		return (0);
76 	else
77 		rt = _CurrentRuneLocale->__runetype[c];
78 	return (rt & f);
79 }
80 
/*
 * iswctype: test wc against the caller-supplied class mask.
 *
 * The #undef removes any macro of the same name so that a real function
 * is defined here.  Returns whatever __istype() reports for (wc, class):
 * the masked type bits, nonzero on a match and 0 otherwise.
 */
#undef iswctype
int
iswctype(wint_t wc, wctype_t class)
{
	int matched;

	matched = __istype(wc, class);
	return (matched);
}
87 
/*
 * _iswctype: variant of the class test taking a wchar_t and an int mask.
 *
 * Both arguments are cast (to wint_t and unsigned int respectively)
 * before being handed to __istype(); the result is returned as unsigned.
 * The #undef removes any macro of the same name first.
 */
#undef _iswctype
unsigned
_iswctype(wchar_t wc, int class)
{
	wint_t ch = (wint_t)wc;
	unsigned int mask = (unsigned int)class;

	return (__istype(ch, mask));
}
94 
95 #undef iswalnum
96 int
97 iswalnum(wint_t wc)
98 {
99 	return (__istype(wc, _CTYPE_A|_CTYPE_D));
100 }
101 
102 #undef iswalpha
103 int
104 iswalpha(wint_t wc)
105 {
106 	return (__istype(wc, _CTYPE_A));
107 }
108 
109 #undef iswblank
110 int
111 iswblank(wint_t wc)
112 {
113 	return (__istype(wc, _CTYPE_B));
114 }
115 
116 #undef iswcntrl
117 int
118 iswcntrl(wint_t wc)
119 {
120 	return (__istype(wc, _CTYPE_C));
121 }
122 
123 #undef iswdigit
124 int
125 iswdigit(wint_t wc)
126 {
127 	return (__isctype(wc, _CTYPE_D));
128 }
129 
130 #undef iswgraph
131 int
132 iswgraph(wint_t wc)
133 {
134 	return (__istype(wc, _CTYPE_G));
135 }
136 
137 #undef isideogram
138 int
139 isideogram(wint_t wc)
140 {
141 	return (__istype(wc, _CTYPE_I));
142 }
143 
144 #undef iswlower
145 int
146 iswlower(wint_t wc)
147 {
148 	return (__istype(wc, _CTYPE_L));
149 }
150 
151 #undef isphonogram
152 int
153 isphonogram(wint_t wc)
154 {
155 	return (__istype(wc, _CTYPE_Q));
156 }
157 
158 #undef iswprint
159 int
160 iswprint(wint_t wc)
161 {
162 	return (__istype(wc, _CTYPE_R));
163 }
164 
165 #undef iswpunct
166 int
167 iswpunct(wint_t wc)
168 {
169 	return (__istype(wc, _CTYPE_P));
170 }
171 
172 #undef iswspace
173 int
174 iswspace(wint_t wc)
175 {
176 	return (__istype(wc, _CTYPE_S));
177 }
178 
179 #undef iswupper
180 int
181 iswupper(wint_t wc)
182 {
183 	return (__istype(wc, _CTYPE_U));
184 }
185 
186 #undef iswxdigit
187 int
188 iswxdigit(wint_t wc)
189 {
190 	return (__isctype(wc, _CTYPE_X));
191 }
192 
193 #undef isenglish
194 int
195 isenglish(wint_t wc)
196 {
197 	return (__istype(wc, _CTYPE_E));
198 }
199 
200 #undef isspecial
201 int
202 isspecial(wint_t wc)
203 {
204 	return (__istype(wc, _CTYPE_T));
205 }
206 
207 #undef isnumber
208 int
209 isnumber(wint_t wc)
210 {
211 	return (__istype(wc, _CTYPE_N));
212 }
213 
/*
 * FreeBSD has iswrune() for use by external programs, and this is used by
 * the "tr" program.  As that program is part of our consolidation, we
 * provide an _ILLUMOS_PRIVATE version of this function that we can use.
 *
 * No programs that are not part of the illumos stack itself should use
 * this function -- programs that do reference it will not be portable to
 * other versions of SunOS or Solaris.
 *
 * Returns the full set of type bits that __istype() finds for wc, which
 * is nonzero when any bit at all is set and 0 otherwise.
 */
int
__iswrune(wint_t wc)
{
	/*
	 * Note, FreeBSD ignored the low order byte, as they encode their
	 * ctype values differently.  We can't do that (ctype is baked into
	 * applications), but instead can just check if *any* bit is set in
	 * the ctype.  Any bit being set indicates it's a valid rune.
	 */
	const unsigned int any_bit = 0xffffffffU;

	return (__istype(wc, any_bit));
}
234