1 /*
   2  * Copyright 2010 Nexenta Systmes, Inc.  All rights reserved.
   3  * Copyright (c) 1995 Alex Tatmanjants <alex@elvisti.kiev.ua>
   4  *              at Electronni Visti IA, Kiev, Ukraine.
   5  *                      All rights reserved.
   6  *
   7  * Redistribution and use in source and binary forms, with or without
   8  * modification, are permitted provided that the following conditions
   9  * are met:
  10  * 1. Redistributions of source code must retain the above copyright
  11  *    notice, this list of conditions and the following disclaimer.
  12  * 2. Redistributions in binary form must reproduce the above copyright
  13  *    notice, this list of conditions and the following disclaimer in the
  14  *    documentation and/or other materials provided with the distribution.
  15  *
  16  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND
  17  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  18  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  19  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR BE LIABLE
  20  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
  21  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
  22  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
  23  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
  24  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
  25  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
  26  * SUCH DAMAGE.
  27  */
  28 
  29 #ifndef _COLLATE_H_
  30 #define _COLLATE_H_
  31 
  32 #include <sys/types.h>
  33 #include <limits.h>
  34 
  35 #define COLLATE_STR_LEN         24              /* should be 64-bit multiple */
  36 #define COLLATE_VERSION         "IllumosCollate2\n"
  37 
  38 #define COLLATE_MAX_PRIORITY    (0x7fffffff)    /* max signed value */
  39 #define COLLATE_SUBST_PRIORITY  (0x40000000)    /* bit indicates subst table */
  40 
  41 #define DIRECTIVE_UNDEF         0x00
  42 #define DIRECTIVE_FORWARD       0x01
  43 #define DIRECTIVE_BACKWARD      0x02
  44 #define DIRECTIVE_POSITION      0x04
  45 #define DIRECTIVE_UNDEFINED     0x08    /* special last weight for UNDEFINED */
  46 
  47 #define DIRECTIVE_DIRECTION_MASK (DIRECTIVE_FORWARD | DIRECTIVE_BACKWARD)
  48 
  49 /*
  50  * The collate file format is as follows:
  51  *
  52  * char         version[COLLATE_STR_LEN];       // must be COLLATE_VERSION
  53  * collate_info_t       info;                   // see below, includes padding
  54  * collate_char_pri_t   char_data[256];         // 8 bit char values
  55  * collate_subst_t      subst[*];               // 0 or more substitutions
  56  * collate_chain_pri_t  chains[*];              // 0 or more chains
  57  * collate_large_pri_t  large[*];               // extended char priorities
  58  *
  59  * Note that all structures must be 32-bit aligned, as each structure
  60  * contains 32-bit member fields.  The entire file is mmap'd, so its
  61  * critical that alignment be observed.  It is not generally safe to
  62  * use any 64-bit values in the structures.
  63  */
  64 
  65 typedef struct collate_info {
  66         uint8_t directive_count;
  67         uint8_t directive[COLL_WEIGHTS_MAX];
  68         int32_t pri_count[COLL_WEIGHTS_MAX];
  69         int32_t flags;
  70         int32_t chain_count;
  71         int32_t large_count;
  72         int32_t subst_count[COLL_WEIGHTS_MAX];
  73         int32_t undef_pri[COLL_WEIGHTS_MAX];
  74 } collate_info_t;
  75 
  76 typedef struct collate_char {
  77         int32_t pri[COLL_WEIGHTS_MAX];
  78 } collate_char_t;
  79 
  80 typedef struct collate_chain {
  81         wchar_t str[COLLATE_STR_LEN];
  82         int32_t pri[COLL_WEIGHTS_MAX];
  83 } collate_chain_t;
  84 
  85 typedef struct collate_large {
  86         int32_t val;
  87         collate_char_t pri;
  88 } collate_large_t;
  89 
  90 typedef struct collate_subst {
  91         int32_t key;
  92         int32_t pri[COLLATE_STR_LEN];
  93 } collate_subst_t;
  94 
  95 int     _collate_load_tables(const char *);
  96 void    _collate_lookup(const wchar_t *, int *, int *, int, int **);
  97 size_t  _collate_wxfrm(const wchar_t *, wchar_t *, size_t);
  98 size_t  _collate_sxfrm(const wchar_t *, char *, size_t);
  99 int     _collate_range_cmp(wchar_t, wchar_t);
 100 
 101 extern int _collate_load_error;
 102 extern int _collate_substitute_nontrivial;
 103 extern collate_info_t *_collate_info;
 104 
 105 #endif /* !_COLLATE_H_ */