Home | History | Annotate | Download | only in dist

Lines Matching refs:utf

76            -1 if \C in UTF-8 mode or (*ACCEPT) was encountered
87 BOOL utf = (options & PCRE_UTF8) != 0;
229 if (utf && HAS_EXTRALEN(cc[-1])) cc += GET_EXTRALEN(cc[-1]);
250 if (utf && HAS_EXTRALEN(cc[-1])) cc += GET_EXTRALEN(cc[-1]);
292 /* The single-byte matcher means we can't proceed in UTF-8 mode. (In
293 non-UTF-8 mode \C will actually be turned into OP_ALLANY, so won't ever
298 if (utf) return -1;
393 ce = cs = (pcre_uchar *)PRIV(find_bracket)(startcode, utf, GET2(slot, 0));
418 ce = cs = (pcre_uchar *)PRIV(find_bracket)(startcode, utf, GET2(cc, 1));
489 of a character, we must take special action for UTF-8 characters. As it
536 if (utf && HAS_EXTRALEN(cc[-1])) cc += GET_EXTRALEN(cc[-1]);
579 UTF-8 mode, for characters greater than 127, we can only do the caseless thing
587 utf TRUE for UTF-8 / UTF-16 / UTF-32 mode
594 compile_data *cd, BOOL utf)
602 if (utf && c > 127)
617 (void)(utf); /* Stops warning for unused parameter */
620 /* Not UTF-8 mode, or character is less than 128. */
635 if (utf && c > 127)
650 (void)(utf); /* Stops warning for unused parameter */
664 /* This function sets starting bits for a character type. In UTF-8 mode, we can
666 confusion with bytes in the middle of UTF-8 characters. In a "traditional"
669 So we deal with that case by considering the UTF-8 encoding.
674 table_limit 32 for non-UTF-8; 16 for UTF-8
706 In UTF-8 mode, we can only do a direct setting for bytes less than 128, as
707 otherwise there can be confusion with bytes in the middle of UTF-8 characters.
709 specific high-valued UTF-8 characters, in this case we have to set the bits for
716 table_limit 32 for non-UTF-8; 16 for UTF-8
750 utf TRUE if in UTF-8 / UTF-16 / UTF-32 mode
760 set_start_bits(const pcre_uchar *code, pcre_uint8 *start_bits, BOOL utf,
766 int table_limit = utf? 16:32;
895 if (utf)
931 rc = set_start_bits(tcode, start_bits, utf, cd);
978 rc = set_start_bits(++tcode, start_bits, utf, cd);
1005 tcode = set_table_bit(start_bits, tcode + 1, FALSE, cd, utf);
1014 tcode = set_table_bit(start_bits, tcode + 1, TRUE, cd, utf);
1022 tcode = set_table_bit(start_bits, tcode + 1 + IMM2_SIZE, FALSE, cd, utf);
1028 tcode = set_table_bit(start_bits, tcode + 1 + IMM2_SIZE, TRUE, cd, utf);
1040 (void)set_table_bit(start_bits, tcode + 1, FALSE, cd, utf);
1051 (void)set_table_bit(start_bits, tcode + 1, TRUE, cd, utf);
1065 if (utf)
1097 if (utf)
1195 if (utf)
1221 if (utf)
1270 a negative class, and we are operating with UTF-8 characters, any byte
1286 if (utf)
1316 /* In UTF-8 mode, the bits in a bit map correspond to character
1327 if (utf)
1343 /* In non-UTF-8 mode, the two bit maps are completely compatible. */