Home | History | Annotate | Download | only in layout
      1 /*
      2  *
      3  * (C) Copyright IBM Corp. 1998-2004 - All Rights Reserved
      4  *
      5  */
      6 
      7 #include "LETypes.h"
      8 #include "LEGlyphFilter.h"
      9 #include "OpenTypeTables.h"
     10 #include "LEGlyphStorage.h"
     11 #include "ThaiShaping.h"
     12 
     13 U_NAMESPACE_BEGIN
     14 
     15 enum {
     16     CH_SPACE        = 0x0020,
     17     CH_YAMAKKAN     = 0x0E4E,
     18     CH_MAI_HANAKAT  = 0x0E31,
     19     CH_SARA_AA      = 0x0E32,
     20     CH_SARA_AM      = 0x0E33,
     21     CH_SARA_UEE     = 0x0E37,
     22     CH_MAITAIKHU    = 0x0E47,
     23     CH_NIKHAHIT     = 0x0E4D,
     24     CH_SARA_U       = 0x0E38,
     25     CH_PHINTHU      = 0x0E3A,
     26     CH_YO_YING      = 0x0E0D,
     27     CH_THO_THAN     = 0x0E10,
     28     CH_DOTTED_CIRCLE = 0x25CC
     29 };
     30 
     31     le_uint8 ThaiShaping::getCharClass(LEUnicode ch)
     32 {
     33     le_uint8 charClass = NON;
     34 
     35     if (ch >= 0x0E00 && ch <= 0x0E5B) {
     36         charClass = classTable[ch - 0x0E00];
     37     }
     38 
     39     return charClass;
     40 }
     41 
     42 
     43 LEUnicode ThaiShaping::leftAboveVowel(LEUnicode vowel, le_uint8 glyphSet)
     44 {
     45     static const LEUnicode leftAboveVowels[][7] = {
     46         {0x0E61, 0x0E32, 0x0E33, 0x0E64, 0x0E65, 0x0E66, 0x0E67},
     47         {0xF710, 0x0E32, 0x0E33, 0xF701, 0xF702, 0xF703, 0xF704},
     48         {0xF884, 0x0E32, 0x0E33, 0xF885, 0xF886, 0xF887, 0xF788},
     49         {0x0E31, 0x0E32, 0x0E33, 0x0E34, 0x0E35, 0x0E36, 0x0E37}
     50     };
     51 
     52     if (vowel >= CH_MAI_HANAKAT && vowel <= CH_SARA_UEE) {
     53         return leftAboveVowels[glyphSet][vowel - CH_MAI_HANAKAT];
     54     }
     55 
     56     if (vowel == CH_YAMAKKAN && glyphSet == 0) {
     57         return 0x0E7E;
     58     }
     59 
     60     return vowel;
     61 }
     62 
     63 LEUnicode ThaiShaping::lowerRightTone(LEUnicode tone, le_uint8 glyphSet)
     64 {
     65     static const LEUnicode lowerRightTones[][7] = {
     66         {0x0E68, 0x0E69, 0x0E6A, 0x0E6B, 0x0E6C, 0x0E6D, 0x0E6E},
     67         {0x0E47, 0xF70A, 0xF70B, 0xF70C, 0xF70D, 0xF70E, 0x0E4D},
     68         {0x0E47, 0xF88B, 0xF88E, 0xF891, 0xF894, 0xF897, 0x0E4D},
     69         {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D}
     70     };
     71 
     72     if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) {
     73         return lowerRightTones[glyphSet][tone - CH_MAITAIKHU];
     74     }
     75 
     76     return tone;
     77 }
     78 
     79 LEUnicode ThaiShaping::lowerLeftTone(LEUnicode tone, le_uint8 glyphSet)
     80 {
     81     static const LEUnicode lowerLeftTones[][7] = {
     82         {0x0E76, 0x0E77, 0x0E78, 0x0E79, 0x0E7A, 0x0E7B, 0x0E7C},
     83         {0xF712, 0xF705, 0xF706, 0xF707, 0xF708, 0xF709, 0xF711},
     84         {0xF889, 0xF88C, 0xF88F, 0xF892, 0xF895, 0xF898, 0xF899},
     85         {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D}
     86     };
     87 
     88     if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) {
     89         return lowerLeftTones[glyphSet][tone - CH_MAITAIKHU];
     90     }
     91 
     92     return tone;
     93 }
     94 
     95 LEUnicode ThaiShaping::upperLeftTone(LEUnicode tone, le_uint8 glyphSet)
     96 {
     97     static const LEUnicode upperLeftTones[][7] = {
     98         {0x0E6F, 0x0E70, 0x0E71, 0x0E72, 0x0E73, 0x0E74, 0x0E75},
     99         {0xF712, 0xF713, 0xF714, 0xF715, 0xF716, 0xF717, 0xF711},
    100         {0xF889, 0xF88A, 0xF88D, 0xF890, 0xF893, 0xF896, 0xF899},
    101         {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D}
    102     };
    103 
    104     if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) {
    105         return upperLeftTones[glyphSet][tone - CH_MAITAIKHU];
    106     }
    107 
    108     return tone;
    109 }
    110 
    111 LEUnicode ThaiShaping::lowerBelowVowel(LEUnicode vowel, le_uint8 glyphSet)
    112 {
    113     static const LEUnicode lowerBelowVowels[][3] = {
    114         {0x0E3C, 0x0E3D, 0x0E3E},
    115         {0xF718, 0xF719, 0xF71A},
    116         {0x0E38, 0x0E39, 0x0E3A},
    117         {0x0E38, 0x0E39, 0x0E3A}
    118 
    119     };
    120 
    121     if (vowel >= CH_SARA_U && vowel <= CH_PHINTHU) {
    122         return lowerBelowVowels[glyphSet][vowel - CH_SARA_U];
    123     }
    124 
    125     return vowel;
    126 }
    127 
    128 LEUnicode ThaiShaping::noDescenderCOD(LEUnicode cod, le_uint8 glyphSet)
    129 {
    130     static const LEUnicode noDescenderCODs[][4] = {
    131         {0x0E60, 0x0E0E, 0x0E0F, 0x0E63},
    132         {0xF70F, 0x0E0E, 0x0E0F, 0xF700},
    133         {0x0E0D, 0x0E0E, 0x0E0F, 0x0E10},
    134         {0x0E0D, 0x0E0E, 0x0E0F, 0x0E10}
    135 
    136     };
    137 
    138     if (cod >= CH_YO_YING && cod <= CH_THO_THAN) {
    139         return noDescenderCODs[glyphSet][cod - CH_YO_YING];
    140     }
    141 
    142     return cod;
    143 }
    144 
    145 le_uint8 ThaiShaping::doTransition (StateTransition transition, LEUnicode currChar, le_int32 inputIndex, le_uint8 glyphSet,
    146         LEUnicode errorChar, LEUnicode *outputBuffer, LEGlyphStorage &glyphStorage, le_int32 &outputIndex)
    147 {
    148     LEErrorCode success = LE_NO_ERROR;
    149 
    150     switch (transition.action) {
    151     case tA:
    152         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    153         outputBuffer[outputIndex++] = currChar;
    154         break;
    155 
    156     case tC:
    157         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    158         outputBuffer[outputIndex++] = currChar;
    159         break;
    160 
    161     case tD:
    162         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    163         outputBuffer[outputIndex++] = leftAboveVowel(currChar, glyphSet);
    164         break;
    165 
    166     case tE:
    167         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    168         outputBuffer[outputIndex++] = lowerRightTone(currChar, glyphSet);
    169         break;
    170 
    171     case tF:
    172         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    173         outputBuffer[outputIndex++] = lowerLeftTone(currChar, glyphSet);
    174         break;
    175 
    176     case tG:
    177         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    178         outputBuffer[outputIndex++] = upperLeftTone(currChar, glyphSet);
    179         break;
    180 
    181     case tH:
    182     {
    183         LEUnicode cod = outputBuffer[outputIndex - 1];
    184         LEUnicode coa = noDescenderCOD(cod, glyphSet);
    185 
    186         if (cod != coa) {
    187             outputBuffer[outputIndex - 1] = coa;
    188 
    189             glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    190             outputBuffer[outputIndex++] = currChar;
    191             break;
    192         }
    193 
    194         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    195         outputBuffer[outputIndex++] = lowerBelowVowel(currChar, glyphSet);
    196         break;
    197     }
    198 
    199     case tR:
    200         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    201         outputBuffer[outputIndex++] = errorChar;
    202 
    203         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    204         outputBuffer[outputIndex++] = currChar;
    205         break;
    206 
    207     case tS:
    208         if (currChar == CH_SARA_AM) {
    209             glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    210             outputBuffer[outputIndex++] = errorChar;
    211         }
    212 
    213         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    214         outputBuffer[outputIndex++] = currChar;
    215         break;
    216 
    217     default:
    218         // FIXME: if we get here, there's an error
    219         // in the state table!
    220         glyphStorage.setCharIndex(outputIndex, inputIndex, success);
    221         outputBuffer[outputIndex++] = currChar;
    222         break;
    223      }
    224 
    225      return transition.nextState;
    226 }
    227 
    228 le_uint8 ThaiShaping::getNextState(LEUnicode ch, le_uint8 prevState, le_int32 inputIndex, le_uint8 glyphSet, LEUnicode errorChar,
    229                               le_uint8 &charClass, LEUnicode *output, LEGlyphStorage &glyphStorage, le_int32 &outputIndex)
    230 {
    231     StateTransition transition;
    232 
    233     charClass = getCharClass(ch);
    234     transition = getTransition(prevState, charClass);
    235 
    236     return doTransition(transition, ch, inputIndex, glyphSet, errorChar, output, glyphStorage, outputIndex);
    237 }
    238 
    239 le_bool ThaiShaping::isLegalHere(LEUnicode ch, le_uint8 prevState)
    240 {
    241     le_uint8 charClass = getCharClass(ch);
    242     StateTransition transition = getTransition(prevState, charClass);
    243 
    244     switch (transition.action) {
    245     case tA:
    246     case tC:
    247     case tD:
    248     case tE:
    249     case tF:
    250     case tG:
    251     case tH:
    252         return TRUE;
    253 
    254     case tR:
    255     case tS:
    256         return FALSE;
    257 
    258     default:
    259         // FIXME: if we get here, there's an error
    260         // in the state table!
    261         return FALSE;
    262     }
    263 }
    264 
    265 le_int32 ThaiShaping::compose(const LEUnicode *input, le_int32 offset, le_int32 charCount, le_uint8 glyphSet,
    266                           LEUnicode errorChar, LEUnicode *output, LEGlyphStorage &glyphStorage)
    267 {
    268     le_uint8 state = 0;
    269     le_int32 inputIndex;
    270     le_int32 outputIndex = 0;
    271     le_uint8 conState = 0xFF;
    272     le_int32 conInput = -1;
    273     le_int32 conOutput = -1;
    274 
    275     for (inputIndex = 0; inputIndex < charCount; inputIndex += 1) {
    276         LEUnicode ch = input[inputIndex + offset];
    277         le_uint8 charClass;
    278 
    279         // Decompose SARA AM into NIKHAHIT + SARA AA
    280         if (ch == CH_SARA_AM && isLegalHere(ch, state)) {
    281             outputIndex = conOutput;
    282             state = getNextState(CH_NIKHAHIT, conState, inputIndex, glyphSet, errorChar, charClass,
    283                 output, glyphStorage, outputIndex);
    284 
    285             for (int j = conInput + 1; j < inputIndex; j += 1) {
    286                 ch = input[j + offset];
    287                 state = getNextState(ch, state, j, glyphSet, errorChar, charClass,
    288                     output, glyphStorage, outputIndex);
    289             }
    290 
    291             ch = CH_SARA_AA;
    292         }
    293 
    294         state = getNextState(ch, state, inputIndex, glyphSet, errorChar, charClass,
    295             output, glyphStorage, outputIndex);
    296 
    297         if (charClass >= CON && charClass <= COD) {
    298             conState = state;
    299             conInput = inputIndex;
    300             conOutput = outputIndex;
    301         }
    302     }
    303 
    304     return outputIndex;
    305 }
    306 
    307 U_NAMESPACE_END
    308