tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

ucol_data.h (4488B)


      1 // © 2016 and later: Unicode, Inc. and others.
      2 // License & terms of use: http://www.unicode.org/copyright.html
      3 /*
      4 *******************************************************************************
      5 *   Copyright (C) 2000-2011, International Business Machines
      6 *   Corporation and others.  All Rights Reserved.
      7 *******************************************************************************
      8 *   file name:  ucol_data.h
      9 *   encoding:   UTF-8
     10 *   tab size:   8 (not used)
     11 *   indentation:4
     12 *
     13 *   created on: 2011jul02
     14 *   created by: Markus Scherer
     15 *
     16 * Private implementation header for C/C++ collation.
     17 * Some file data structure definitions were moved here from i18n/ucol_imp.h
     18 * so that the common library (via ucol_swp.cpp) need not depend on the i18n library at all.
     19 *
     20 * We do not want to move the collation swapper to the i18n library because
     21 * a) the resource bundle swapper depends on it and would have to move too, and
     22 * b) we might want to eventually implement runtime data swapping,
     23 *    which might (or might not) be easier if all swappers are in the common library.
     24 */
     25 
     26 #ifndef __UCOL_DATA_H__
     27 #define __UCOL_DATA_H__
     28 
     29 #include "unicode/utypes.h"
     30 
     31 #if !UCONFIG_NO_COLLATION
     32 
     33 /* let us know whether reserved fields are reset to zero or junked */
     34 #define UCOL_HEADER_MAGIC 0x20030618
     35 
     36 typedef struct {
     37      int32_t size;
     38      /* all the offsets are in bytes */
     39      /* to get the address add to the header address and cast properly */
     40      uint32_t options; /* these are the default options for the collator */
     41      uint32_t UCAConsts; /* structure which holds values for indirect positioning and implicit ranges */
     42      uint32_t contractionUCACombos;        /* this one is needed only for UCA, to copy the appropriate contractions */
     43      uint32_t magic;            /* magic number - lets us know whether reserved data is reset or junked */
     44      uint32_t mappingPosition;  /* const uint8_t *mappingPosition; */
     45      uint32_t expansion;        /* uint32_t *expansion;            */
     46      uint32_t contractionIndex; /* char16_t *contractionIndex;        */
     47      uint32_t contractionCEs;   /* uint32_t *contractionCEs;       */
     48      uint32_t contractionSize;  /* needed for various closures */
     49      /*int32_t latinOneMapping;*/ /* this is now handled in the trie itself *//* fast track to latin1 chars      */
     50 
     51      uint32_t endExpansionCE;      /* array of last collation element in
     52                                       expansion */
     53      uint32_t expansionCESize;     /* array of maximum expansion size
     54                                       corresponding to the expansion
     55                                       collation elements with last element
     56                                       in endExpansionCE*/
     57      int32_t  endExpansionCECount; /* size of endExpansionCE */
     58      uint32_t unsafeCP;            /* hash table of unsafe code points */
     59      uint32_t contrEndCP;          /* hash table of final code points  */
     60                                    /*   in contractions.               */
     61 
     62      int32_t contractionUCACombosSize;     /* number of UCA contraction items. */
     63                                            /*Length is contractionUCACombosSize*contractionUCACombosWidth*sizeof(char16_t) */
     64      UBool jamoSpecial;                    /* is jamoSpecial */
     65      UBool isBigEndian;                    /* is this data big endian? from the UDataInfo header*/
     66      uint8_t charSetFamily;                /* what is the charset family of this data from the UDataInfo header*/
     67      uint8_t contractionUCACombosWidth;    /* width of UCA combos field */
     68      UVersionInfo version;
     69      UVersionInfo UCAVersion;              /* version of the UCA, read from file */
     70      UVersionInfo UCDVersion;              /* UCD version, obtained by u_getUnicodeVersion */
     71      UVersionInfo formatVersion;           /* format version from the UDataInfo header */
     72      uint32_t scriptToLeadByte;            /* offset to script to lead collation byte mapping data */
     73      uint32_t leadByteToScript;            /* offset to lead collation byte to script mapping data */
     74      uint8_t reserved[76];                 /* for future use */
     75 } UCATableHeader;
     76 
     77 typedef struct {
     78  uint32_t byteSize;
     79  uint32_t tableSize;
     80  uint32_t contsSize;
     81  uint32_t table;
     82  uint32_t conts;
     83  UVersionInfo UCAVersion;              /* version of the UCA, read from file */
     84  uint8_t padding[8];
     85 } InverseUCATableHeader;
     86 
     87 #endif  /* !UCONFIG_NO_COLLATION */
     88 
     89 #endif  /* __UCOL_DATA_H__ */