1 /* 2 * Copyright 2013 Garrett D'Amore <garrett@damore.org> 3 * Copyright 2017 Nexenta Systems, Inc. 4 * Copyright (c) 1993 5 * The Regents of the University of California. All rights reserved. 6 * 7 * This code is derived from software contributed to Berkeley by 8 * Paul Borman at Krystal Technologies. 9 * 10 * Redistribution and use in source and binary forms, with or without 11 * modification, are permitted provided that the following conditions 12 * are met: 13 * 1. Redistributions of source code must retain the above copyright 14 * notice, this list of conditions and the following disclaimer. 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in the 17 * documentation and/or other materials provided with the distribution. 18 * 4. Neither the name of the University nor the names of its contributors 19 * may be used to endorse or promote products derived from this software 20 * without specific prior written permission. 21 * 22 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND 23 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 24 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 25 * ARE DISCLAIMED. IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE 26 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 27 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 28 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 29 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 30 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 31 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 32 * SUCH DAMAGE. 33 */ 34 35 #include "lint.h" 36 #include <ctype.h> 37 #include <wchar.h> 38 #include "runetype.h" 39 #include "mblocal.h" 40 #include "_ctype.h" 41 42 #define _DEFRUNETYPE { \ 43 /* 00 */ \ 44 _CTYPE_C, \ 45 _CTYPE_C, \ 46 _CTYPE_C, \ 47 _CTYPE_C, \ 48 _CTYPE_C, \ 49 _CTYPE_C, \ 50 _CTYPE_C, \ 51 _CTYPE_C, \ 52 /* 08 */ \ 53 _CTYPE_C, \ 54 _CTYPE_C|_CTYPE_S|_CTYPE_B, \ 55 _CTYPE_C|_CTYPE_S, \ 56 _CTYPE_C|_CTYPE_S, \ 57 _CTYPE_C|_CTYPE_S, \ 58 _CTYPE_C|_CTYPE_S, \ 59 _CTYPE_C, \ 60 _CTYPE_C, \ 61 /* 10 */ \ 62 _CTYPE_C, \ 63 _CTYPE_C, \ 64 _CTYPE_C, \ 65 _CTYPE_C, \ 66 _CTYPE_C, \ 67 _CTYPE_C, \ 68 _CTYPE_C, \ 69 _CTYPE_C, \ 70 /* 18 */ \ 71 _CTYPE_C, \ 72 _CTYPE_C, \ 73 _CTYPE_C, \ 74 _CTYPE_C, \ 75 _CTYPE_C, \ 76 _CTYPE_C, \ 77 _CTYPE_C, \ 78 _CTYPE_C, \ 79 /* 20 */ \ 80 _CTYPE_S|_CTYPE_B|_CTYPE_R, \ 81 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 82 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 83 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 84 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 85 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 86 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 87 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 88 /* 28 */ \ 89 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 90 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 91 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 92 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 93 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 94 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 95 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 96 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 97 /* 30 */ \ 98 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 99 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 100 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 101 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 102 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 103 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 104 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 105 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 106 /* 38 */ \ 107 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 108 _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \ 109 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 110 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 111 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 112 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 113 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 114 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 115 /* 40 */ \ 116 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 117 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 118 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 119 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 120 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 121 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 122 _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 123 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 124 /* 48 */ \ 125 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 126 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 127 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 128 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 129 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 130 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 131 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 132 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 133 /* 50 */ \ 134 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 135 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 136 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 137 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 138 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 139 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 140 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 141 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 142 /* 58 */ \ 143 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 144 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 145 _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 146 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 147 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 148 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 149 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 150 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 151 /* 60 */ \ 152 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 153 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 154 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 155 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 156 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 157 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 158 _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 159 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 160 /* 68 */ \ 161 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 162 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 163 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 164 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 165 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 166 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 167 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 168 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 169 /* 70 */ \ 170 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 171 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 172 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 173 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 174 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 175 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 176 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 177 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 178 /* 78 */ \ 179 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 180 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 181 _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \ 182 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 183 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 184 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 185 _CTYPE_P|_CTYPE_R|_CTYPE_G, \ 186 _CTYPE_C, \ 187 } 188 189 #define _DEFMAPLOWER { \ 190 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, \ 191 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, \ 192 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, \ 193 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f, \ 194 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27, \ 195 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f, \ 196 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, \ 197 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f, \ 198 0x40, 'a', 'b', 'c', 'd', 'e', 'f', 'g', \ 199 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', \ 200 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', \ 201 'x', 'y', 'z', 0x5b, 0x5c, 0x5d, 0x5e, 0x5f, \ 202 0x60, 'a', 'b', 'c', 'd', 'e', 'f', 'g', \ 203 'h', 'i', 'j', 'k', 'l', 'm', 'n', 'o', \ 204 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', \ 205 'x', 'y', 'z', 0x7b, 0x7c, 0x7d, 0x7e, 0x7f, \ 206 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, \ 207 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, \ 208 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, \ 209 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f, \ 210 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, \ 211 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf, \ 212 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7, \ 213 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, \ 214 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7, \ 215 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, \ 216 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, \ 217 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf, \ 218 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, \ 219 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, \ 220 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, \ 221 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff, \ 222 } 223 224 #define _DEFMAPUPPER { \ 225 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, \ 226 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f, \ 227 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, \ 228 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f, \ 229 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27, \ 230 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f, \ 231 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, \ 232 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f, \ 233 0x40, 'A', 'B', 'C', 'D', 'E', 'F', 'G', \ 234 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', \ 235 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', \ 236 'X', 'Y', 'Z', 0x5b, 0x5c, 0x5d, 0x5e, 0x5f, \ 237 0x60, 'A', 'B', 'C', 'D', 'E', 'F', 'G', \ 238 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', \ 239 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', \ 240 'X', 'Y', 'Z', 0x7b, 0x7c, 0x7d, 0x7e, 0x7f, \ 241 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87, \ 242 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f, \ 243 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97, \ 244 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f, \ 245 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7, \ 246 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf, \ 247 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7, \ 248 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf, \ 249 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7, \ 250 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf, \ 251 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7, \ 252 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf, \ 253 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7, \ 254 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef, \ 255 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7, \ 256 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff, \ 257 } 258 259 _RuneLocale _DefaultRuneLocale = { 260 _RUNE_MAGIC_1, 261 "NONE", 262 _DEFRUNETYPE, 263 _DEFMAPLOWER, 264 _DEFMAPUPPER, 265 }; 266 267 /* 268 * __ctype_mask, __trans_lower, and __trans_upper come from former _ctype.c and 269 * have to stay pointers for binary compatibility, so we provide separate 270 * storage for them, initialized to "C" locale contents by default. 271 */ 272 static unsigned int ___ctype_mask[_CACHED_RUNES] = _DEFRUNETYPE; 273 unsigned int *__ctype_mask = ___ctype_mask; 274 275 static int ___trans_lower[_CACHED_RUNES] = _DEFMAPLOWER; 276 int *__trans_lower = ___trans_lower; 277 278 static int ___trans_upper[_CACHED_RUNES] = _DEFMAPUPPER; 279 int *__trans_upper = ___trans_upper;