tor-browser

The Tor Browser
git clone https://git.dasho.dev/tor-browser.git
Log | Files | Refs | README | LICENSE

hb-ot-shaper-indic-machine.rl (4399B)


      1 /*
      2 * Copyright © 2011,2012  Google, Inc.
      3 *
      4 *  This is part of HarfBuzz, a text shaping library.
      5 *
      6 * Permission is hereby granted, without written agreement and without
      7 * license or royalty fees, to use, copy, modify, and distribute this
      8 * software and its documentation for any purpose, provided that the
      9 * above copyright notice and the following two paragraphs appear in
     10 * all copies of this software.
     11 *
     12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR
     13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES
     14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN
     15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH
     16 * DAMAGE.
     17 *
     18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING,
     19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND
     20 * FITNESS FOR A PARTICULAR PURPOSE.  THE SOFTWARE PROVIDED HEREUNDER IS
     21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO
     22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS.
     23 *
     24 * Google Author(s): Behdad Esfahbod
     25 */
     26 
     27 #ifndef HB_OT_SHAPER_INDIC_MACHINE_HH
     28 #define HB_OT_SHAPER_INDIC_MACHINE_HH
     29 
     30 #include "hb.hh"
     31 
     32 #include "hb-ot-layout.hh"
     33 #include "hb-ot-shaper-indic.hh"
     34 
     35 /* buffer var allocations */
     36 #define indic_category() ot_shaper_var_u8_category() /* indic_category_t */
     37 #define indic_position() ot_shaper_var_u8_auxiliary() /* indic_position_t */
     38 
     39 using indic_category_t = unsigned;
     40 using indic_position_t = ot_position_t;
     41 
     42 #define I_Cat(Cat) indic_syllable_machine_ex_##Cat
     43 
     44 enum indic_syllable_type_t {
     45  indic_consonant_syllable,
     46  indic_vowel_syllable,
     47  indic_standalone_cluster,
     48  indic_symbol_cluster,
     49  indic_broken_cluster,
     50  indic_non_indic_cluster,
     51 };
     52 
     53 %%{
     54  machine indic_syllable_machine;
     55  alphtype unsigned char;
     56  write exports;
     57  write data;
     58 }%%
     59 
     60 %%{
     61 
     62 
     63 export X    = 0;
     64 export C    = 1;
     65 export V    = 2;
     66 export N    = 3;
     67 export H    = 4;
     68 export ZWNJ = 5;
     69 export ZWJ  = 6;
     70 export M    = 7;
     71 export SM   = 8;
     72 export A    = 9;
     73 export VD   = 9;
     74 export PLACEHOLDER = 10;
     75 export DOTTEDCIRCLE = 11;
     76 export RS    = 12;
     77 export MPst  = 13;
     78 export Repha = 14;
     79 export Ra    = 15;
     80 export CM    = 16;
     81 export Symbol= 17;
     82 export CS    = 18;
     83 export SMPst = 57;
     84 
     85 
     86 c = (C | Ra);			# is_consonant
     87 n = ((ZWNJ?.RS)? (N.N?)?);	# is_consonant_modifier
     88 z = ZWJ|ZWNJ;			# is_joiner
     89 reph = (Ra H | Repha);		# possible reph
     90 sm = SM | SMPst;
     91 
     92 cn = c.ZWJ?.n?;
     93 symbol = Symbol.N?;
     94 matra_group = z*.(M | sm? MPst).N?.H?;
     95 syllable_tail = (z?.sm.sm?.ZWNJ?)? (A | VD)*;
     96 halant_group = (z?.H.(ZWJ.N?)?);
     97 final_halant_group = halant_group | H.ZWNJ;
     98 medial_group = CM?;
     99 halant_or_matra_group = (final_halant_group | matra_group*);
    100 
    101 complex_syllable_tail = (halant_group.cn)* medial_group halant_or_matra_group syllable_tail;
    102 
    103 consonant_syllable =	(Repha|CS)? cn complex_syllable_tail;
    104 vowel_syllable =	reph? V.n? (ZWJ | complex_syllable_tail);
    105 standalone_cluster =	((Repha|CS)? PLACEHOLDER | reph? DOTTEDCIRCLE).n? complex_syllable_tail;
    106 symbol_cluster =	symbol syllable_tail;
    107 broken_cluster =	reph? n? complex_syllable_tail;
    108 other =			any;
    109 
    110 main := |*
    111 consonant_syllable	=> { found_syllable (indic_consonant_syllable); };
    112 vowel_syllable		=> { found_syllable (indic_vowel_syllable); };
    113 standalone_cluster	=> { found_syllable (indic_standalone_cluster); };
    114 symbol_cluster		=> { found_syllable (indic_symbol_cluster); };
    115 SMPst			=> { found_syllable (indic_non_indic_cluster); };
    116 broken_cluster		=> { found_syllable (indic_broken_cluster); buffer->scratch_flags |= HB_BUFFER_SCRATCH_FLAG_HAS_BROKEN_SYLLABLE; };
    117 other			=> { found_syllable (indic_non_indic_cluster); };
    118 *|;
    119 
    120 
    121 }%%
    122 
    123 #define found_syllable(syllable_type) \
    124  HB_STMT_START { \
    125    if (0) fprintf (stderr, "syllable %u..%u %s\n", ts, te, #syllable_type); \
    126    for (unsigned int i = ts; i < te; i++) \
    127      info[i].syllable() = (syllable_serial << 4) | syllable_type; \
    128    syllable_serial++; \
    129    if (syllable_serial == 16) syllable_serial = 1; \
    130  } HB_STMT_END
    131 
    132 inline void
    133 find_syllables_indic (hb_buffer_t *buffer)
    134 {
    135  unsigned int p, pe, eof, ts, te, act;
    136  int cs;
    137  hb_glyph_info_t *info = buffer->info;
    138  %%{
    139    write init;
    140    getkey info[p].indic_category();
    141  }%%
    142 
    143  p = 0;
    144  pe = eof = buffer->len;
    145 
    146  unsigned int syllable_serial = 1;
    147  %%{
    148    write exec;
    149  }%%
    150 }
    151 
    152 #undef found_syllable
    153 
    154 #endif /* HB_OT_SHAPER_INDIC_MACHINE_HH */