1 /*
   2  * Copyright 2013 Garrett D'Amore <garrett@damore.org>
   3  * Copyright 2017 Nexenta Systems, Inc.
   4  * Copyright (c) 1993
   5  *      The Regents of the University of California.  All rights reserved.
   6  *
   7  * This code is derived from software contributed to Berkeley by
   8  * Paul Borman at Krystal Technologies.
   9  *
  10  * Redistribution and use in source and binary forms, with or without
  11  * modification, are permitted provided that the following conditions
  12  * are met:
  13  * 1. Redistributions of source code must retain the above copyright
  14  *    notice, this list of conditions and the following disclaimer.
  15  * 2. Redistributions in binary form must reproduce the above copyright
  16  *    notice, this list of conditions and the following disclaimer in the
  17  *    documentation and/or other materials provided with the distribution.
  18  * 4. Neither the name of the University nor the names of its contributors
  19  *    may be used to endorse or promote products derived from this software
  20  *    without specific prior written permission.
  21  *
  22  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
  23  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
  26  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  27  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  28  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  29  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  30  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  31  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  32  * SUCH DAMAGE.
  33  */
  34 
  35 #include "lint.h"
  36 #include <ctype.h>
  37 #include <wchar.h>
  38 #include "runetype.h"
  39 #include "mblocal.h"
  40 #include "_ctype.h"
  41 
  42 #define _DEFRUNETYPE { \
  43         /* 00 */ \
  44         _CTYPE_C, \
  45         _CTYPE_C, \
  46         _CTYPE_C, \
  47         _CTYPE_C, \
  48         _CTYPE_C, \
  49         _CTYPE_C, \
  50         _CTYPE_C, \
  51         _CTYPE_C, \
  52         /* 08 */ \
  53         _CTYPE_C, \
  54         _CTYPE_C|_CTYPE_S|_CTYPE_B, \
  55         _CTYPE_C|_CTYPE_S, \
  56         _CTYPE_C|_CTYPE_S, \
  57         _CTYPE_C|_CTYPE_S, \
  58         _CTYPE_C|_CTYPE_S, \
  59         _CTYPE_C, \
  60         _CTYPE_C, \
  61         /* 10 */ \
  62         _CTYPE_C, \
  63         _CTYPE_C, \
  64         _CTYPE_C, \
  65         _CTYPE_C, \
  66         _CTYPE_C, \
  67         _CTYPE_C, \
  68         _CTYPE_C, \
  69         _CTYPE_C, \
  70         /* 18 */ \
  71         _CTYPE_C, \
  72         _CTYPE_C, \
  73         _CTYPE_C, \
  74         _CTYPE_C, \
  75         _CTYPE_C, \
  76         _CTYPE_C, \
  77         _CTYPE_C, \
  78         _CTYPE_C, \
  79         /* 20 */ \
  80         _CTYPE_S|_CTYPE_B|_CTYPE_R, \
  81         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  82         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  83         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  84         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  85         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  86         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  87         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  88         /* 28 */ \
  89         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  90         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  91         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  92         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  93         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  94         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  95         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  96         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
  97         /* 30 */ \
  98         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
  99         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 100         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 101         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 102         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 103         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 104         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 105         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 106         /* 38 */ \
 107         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 108         _CTYPE_D|_CTYPE_R|_CTYPE_G|_CTYPE_X, \
 109         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 110         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 111         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 112         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 113         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 114         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 115         /* 40 */ \
 116         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 117         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 118         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 119         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 120         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 121         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 122         _CTYPE_U|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 123         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 124         /* 48 */ \
 125         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 126         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 127         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 128         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 129         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 130         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 131         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 132         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 133         /* 50 */ \
 134         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 135         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 136         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 137         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 138         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 139         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 140         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 141         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 142         /* 58 */ \
 143         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 144         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 145         _CTYPE_U|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 146         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 147         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 148         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 149         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 150         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 151         /* 60 */ \
 152         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 153         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 154         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 155         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 156         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 157         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 158         _CTYPE_L|_CTYPE_X|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 159         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 160         /* 68 */ \
 161         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 162         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 163         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 164         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 165         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 166         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 167         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 168         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 169         /* 70 */ \
 170         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 171         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 172         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 173         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 174         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 175         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 176         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 177         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 178         /* 78 */ \
 179         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 180         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 181         _CTYPE_L|_CTYPE_R|_CTYPE_G|_CTYPE_A, \
 182         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 183         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 184         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 185         _CTYPE_P|_CTYPE_R|_CTYPE_G, \
 186         _CTYPE_C, \
 187 }
 188 
 189 #define _DEFMAPLOWER { \
 190         0x00,   0x01,   0x02,   0x03,   0x04,   0x05,   0x06,   0x07, \
 191         0x08,   0x09,   0x0a,   0x0b,   0x0c,   0x0d,   0x0e,   0x0f, \
 192         0x10,   0x11,   0x12,   0x13,   0x14,   0x15,   0x16,   0x17, \
 193         0x18,   0x19,   0x1a,   0x1b,   0x1c,   0x1d,   0x1e,   0x1f, \
 194         0x20,   0x21,   0x22,   0x23,   0x24,   0x25,   0x26,   0x27, \
 195         0x28,   0x29,   0x2a,   0x2b,   0x2c,   0x2d,   0x2e,   0x2f, \
 196         0x30,   0x31,   0x32,   0x33,   0x34,   0x35,   0x36,   0x37, \
 197         0x38,   0x39,   0x3a,   0x3b,   0x3c,   0x3d,   0x3e,   0x3f, \
 198         0x40,   'a',    'b',    'c',    'd',    'e',    'f',    'g', \
 199         'h',    'i',    'j',    'k',    'l',    'm',    'n',    'o', \
 200         'p',    'q',    'r',    's',    't',    'u',    'v',    'w', \
 201         'x',    'y',    'z',    0x5b,   0x5c,   0x5d,   0x5e,   0x5f, \
 202         0x60,   'a',    'b',    'c',    'd',    'e',    'f',    'g', \
 203         'h',    'i',    'j',    'k',    'l',    'm',    'n',    'o', \
 204         'p',    'q',    'r',    's',    't',    'u',    'v',    'w', \
 205         'x',    'y',    'z',    0x7b,   0x7c,   0x7d,   0x7e,   0x7f, \
 206         0x80,   0x81,   0x82,   0x83,   0x84,   0x85,   0x86,   0x87, \
 207         0x88,   0x89,   0x8a,   0x8b,   0x8c,   0x8d,   0x8e,   0x8f, \
 208         0x90,   0x91,   0x92,   0x93,   0x94,   0x95,   0x96,   0x97, \
 209         0x98,   0x99,   0x9a,   0x9b,   0x9c,   0x9d,   0x9e,   0x9f, \
 210         0xa0,   0xa1,   0xa2,   0xa3,   0xa4,   0xa5,   0xa6,   0xa7, \
 211         0xa8,   0xa9,   0xaa,   0xab,   0xac,   0xad,   0xae,   0xaf, \
 212         0xb0,   0xb1,   0xb2,   0xb3,   0xb4,   0xb5,   0xb6,   0xb7, \
 213         0xb8,   0xb9,   0xba,   0xbb,   0xbc,   0xbd,   0xbe,   0xbf, \
 214         0xc0,   0xc1,   0xc2,   0xc3,   0xc4,   0xc5,   0xc6,   0xc7, \
 215         0xc8,   0xc9,   0xca,   0xcb,   0xcc,   0xcd,   0xce,   0xcf, \
 216         0xd0,   0xd1,   0xd2,   0xd3,   0xd4,   0xd5,   0xd6,   0xd7, \
 217         0xd8,   0xd9,   0xda,   0xdb,   0xdc,   0xdd,   0xde,   0xdf, \
 218         0xe0,   0xe1,   0xe2,   0xe3,   0xe4,   0xe5,   0xe6,   0xe7, \
 219         0xe8,   0xe9,   0xea,   0xeb,   0xec,   0xed,   0xee,   0xef, \
 220         0xf0,   0xf1,   0xf2,   0xf3,   0xf4,   0xf5,   0xf6,   0xf7, \
 221         0xf8,   0xf9,   0xfa,   0xfb,   0xfc,   0xfd,   0xfe,   0xff, \
 222 }
 223 
 224 #define _DEFMAPUPPER { \
 225         0x00,   0x01,   0x02,   0x03,   0x04,   0x05,   0x06,   0x07, \
 226         0x08,   0x09,   0x0a,   0x0b,   0x0c,   0x0d,   0x0e,   0x0f, \
 227         0x10,   0x11,   0x12,   0x13,   0x14,   0x15,   0x16,   0x17, \
 228         0x18,   0x19,   0x1a,   0x1b,   0x1c,   0x1d,   0x1e,   0x1f, \
 229         0x20,   0x21,   0x22,   0x23,   0x24,   0x25,   0x26,   0x27, \
 230         0x28,   0x29,   0x2a,   0x2b,   0x2c,   0x2d,   0x2e,   0x2f, \
 231         0x30,   0x31,   0x32,   0x33,   0x34,   0x35,   0x36,   0x37, \
 232         0x38,   0x39,   0x3a,   0x3b,   0x3c,   0x3d,   0x3e,   0x3f, \
 233         0x40,   'A',    'B',    'C',    'D',    'E',    'F',    'G', \
 234         'H',    'I',    'J',    'K',    'L',    'M',    'N',    'O', \
 235         'P',    'Q',    'R',    'S',    'T',    'U',    'V',    'W', \
 236         'X',    'Y',    'Z',    0x5b,   0x5c,   0x5d,   0x5e,   0x5f, \
 237         0x60,   'A',    'B',    'C',    'D',    'E',    'F',    'G', \
 238         'H',    'I',    'J',    'K',    'L',    'M',    'N',    'O', \
 239         'P',    'Q',    'R',    'S',    'T',    'U',    'V',    'W', \
 240         'X',    'Y',    'Z',    0x7b,   0x7c,   0x7d,   0x7e,   0x7f, \
 241         0x80,   0x81,   0x82,   0x83,   0x84,   0x85,   0x86,   0x87, \
 242         0x88,   0x89,   0x8a,   0x8b,   0x8c,   0x8d,   0x8e,   0x8f, \
 243         0x90,   0x91,   0x92,   0x93,   0x94,   0x95,   0x96,   0x97, \
 244         0x98,   0x99,   0x9a,   0x9b,   0x9c,   0x9d,   0x9e,   0x9f, \
 245         0xa0,   0xa1,   0xa2,   0xa3,   0xa4,   0xa5,   0xa6,   0xa7, \
 246         0xa8,   0xa9,   0xaa,   0xab,   0xac,   0xad,   0xae,   0xaf, \
 247         0xb0,   0xb1,   0xb2,   0xb3,   0xb4,   0xb5,   0xb6,   0xb7, \
 248         0xb8,   0xb9,   0xba,   0xbb,   0xbc,   0xbd,   0xbe,   0xbf, \
 249         0xc0,   0xc1,   0xc2,   0xc3,   0xc4,   0xc5,   0xc6,   0xc7, \
 250         0xc8,   0xc9,   0xca,   0xcb,   0xcc,   0xcd,   0xce,   0xcf, \
 251         0xd0,   0xd1,   0xd2,   0xd3,   0xd4,   0xd5,   0xd6,   0xd7, \
 252         0xd8,   0xd9,   0xda,   0xdb,   0xdc,   0xdd,   0xde,   0xdf, \
 253         0xe0,   0xe1,   0xe2,   0xe3,   0xe4,   0xe5,   0xe6,   0xe7, \
 254         0xe8,   0xe9,   0xea,   0xeb,   0xec,   0xed,   0xee,   0xef, \
 255         0xf0,   0xf1,   0xf2,   0xf3,   0xf4,   0xf5,   0xf6,   0xf7, \
 256         0xf8,   0xf9,   0xfa,   0xfb,   0xfc,   0xfd,   0xfe,   0xff, \
 257 }
 258 
 259 _RuneLocale _DefaultRuneLocale = {
 260         _RUNE_MAGIC_1,
 261         "NONE",
 262         _DEFRUNETYPE,
 263         _DEFMAPLOWER,
 264         _DEFMAPUPPER,
 265 };
 266 
 267 /*
 268  * __ctype_mask, __trans_lower, and __trans_upper come from former _ctype.c and
 269  * have to stay pointers for binary compatibility, so we provide separate
 270  * storage for them, initialized to "C" locale contents by default.
 271  */
 272 static unsigned int ___ctype_mask[_CACHED_RUNES] = _DEFRUNETYPE;
 273 unsigned int *__ctype_mask = ___ctype_mask;
 274 
 275 static int ___trans_lower[_CACHED_RUNES] = _DEFMAPLOWER;
 276 int *__trans_lower = ___trans_lower;
 277 
 278 static int ___trans_upper[_CACHED_RUNES] = _DEFMAPUPPER;
 279 int *__trans_upper = ___trans_upper;