1 /* 2 * Copyright 2014 Google Inc. All rights reserved. 3 * 4 * Licensed under the Apache License, Version 2.0 (the "License"); 5 * you may not use this file except in compliance with the License. 6 * You may obtain a copy of the License at 7 * 8 * http://www.apache.org/licenses/LICENSE-2.0 9 * 10 * Unless required by applicable law or agreed to in writing, software 11 * distributed under the License is distributed on an "AS IS" BASIS, 12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13 * See the License for the specific language governing permissions and 14 * limitations under the License. 15 */ 16 17 #ifndef FLATBUFFERS_UTIL_H_ 18 #define FLATBUFFERS_UTIL_H_ 19 20 #include "flatbuffers/base.h" 21 22 #include <errno.h> 23 24 #ifndef FLATBUFFERS_PREFER_PRINTF 25 # include <sstream> 26 #else // FLATBUFFERS_PREFER_PRINTF 27 # include <float.h> 28 # include <stdio.h> 29 #endif // FLATBUFFERS_PREFER_PRINTF 30 31 #include <iomanip> 32 #include <string> 33 34 namespace flatbuffers { 35 36 // @locale-independent functions for ASCII characters set. 37 38 // Check that integer scalar is in closed range: (a <= x <= b) 39 // using one compare (conditional branch) operator. 40 template<typename T> inline bool check_in_range(T x, T a, T b) { 41 // (Hacker's Delight): `a <= x <= b` <=> `(x-a) <={u} (b-a)`. 42 FLATBUFFERS_ASSERT(a <= b); // static_assert only if 'a' & 'b' templated 43 typedef typename flatbuffers::make_unsigned<T>::type U; 44 return (static_cast<U>(x - a) <= static_cast<U>(b - a)); 45 } 46 47 // Case-insensitive isalpha 48 inline bool is_alpha(char c) { 49 // ASCII only: alpha to upper case => reset bit 0x20 (~0x20 = 0xDF). 50 return check_in_range(c & 0xDF, 'a' & 0xDF, 'z' & 0xDF); 51 } 52 53 // Check (case-insensitive) that `c` is equal to alpha. 54 inline bool is_alpha_char(char c, char alpha) { 55 FLATBUFFERS_ASSERT(is_alpha(alpha)); 56 // ASCII only: alpha to upper case => reset bit 0x20 (~0x20 = 0xDF). 57 return ((c & 0xDF) == (alpha & 0xDF)); 58 } 59 60 // https://en.cppreference.com/w/cpp/string/byte/isxdigit 61 // isdigit and isxdigit are the only standard narrow character classification 62 // functions that are not affected by the currently installed C locale. although 63 // some implementations (e.g. Microsoft in 1252 codepage) may classify 64 // additional single-byte characters as digits. 65 inline bool is_digit(char c) { return check_in_range(c, '0', '9'); } 66 67 inline bool is_xdigit(char c) { 68 // Replace by look-up table. 69 return is_digit(c) || check_in_range(c & 0xDF, 'a' & 0xDF, 'f' & 0xDF); 70 } 71 72 // Case-insensitive isalnum 73 inline bool is_alnum(char c) { return is_alpha(c) || is_digit(c); } 74 75 // @end-locale-independent functions for ASCII character set 76 77 #ifdef FLATBUFFERS_PREFER_PRINTF 78 template<typename T> size_t IntToDigitCount(T t) { 79 size_t digit_count = 0; 80 // Count the sign for negative numbers 81 if (t < 0) digit_count++; 82 // Count a single 0 left of the dot for fractional numbers 83 if (-1 < t && t < 1) digit_count++; 84 // Count digits until fractional part 85 T eps = std::numeric_limits<float>::epsilon(); 86 while (t <= (-1 + eps) || (1 - eps) <= t) { 87 t /= 10; 88 digit_count++; 89 } 90 return digit_count; 91 } 92 93 template<typename T> size_t NumToStringWidth(T t, int precision = 0) { 94 size_t string_width = IntToDigitCount(t); 95 // Count the dot for floating point numbers 96 if (precision) string_width += (precision + 1); 97 return string_width; 98 } 99 100 template<typename T> 101 std::string NumToStringImplWrapper(T t, const char *fmt, int precision = 0) { 102 size_t string_width = NumToStringWidth(t, precision); 103 std::string s(string_width, 0x00); 104 // Allow snprintf to use std::string trailing null to detect buffer overflow 105 snprintf(const_cast<char *>(s.data()), (s.size() + 1), fmt, precision, t); 106 return s; 107 } 108 #endif // FLATBUFFERS_PREFER_PRINTF 109 110 // Convert an integer or floating point value to a string. 111 // In contrast to std::stringstream, "char" values are 112 // converted to a string of digits, and we don't use scientific notation. 113 template<typename T> std::string NumToString(T t) { 114 // clang-format off 115 116 #ifndef FLATBUFFERS_PREFER_PRINTF 117 std::stringstream ss; 118 ss << t; 119 return ss.str(); 120 #else // FLATBUFFERS_PREFER_PRINTF 121 auto v = static_cast<long long>(t); 122 return NumToStringImplWrapper(v, "%.*lld"); 123 #endif // FLATBUFFERS_PREFER_PRINTF 124 // clang-format on 125 } 126 // Avoid char types used as character data. 127 template<> inline std::string NumToString<signed char>(signed char t) { 128 return NumToString(static_cast<int>(t)); 129 } 130 template<> inline std::string NumToString<unsigned char>(unsigned char t) { 131 return NumToString(static_cast<int>(t)); 132 } 133 template<> inline std::string NumToString<char>(char t) { 134 return NumToString(static_cast<int>(t)); 135 } 136 #if defined(FLATBUFFERS_CPP98_STL) 137 template<> inline std::string NumToString<long long>(long long t) { 138 char buf[21]; // (log((1 << 63) - 1) / log(10)) + 2 139 snprintf(buf, sizeof(buf), "%lld", t); 140 return std::string(buf); 141 } 142 143 template<> 144 inline std::string NumToString<unsigned long long>(unsigned long long t) { 145 char buf[22]; // (log((1 << 63) - 1) / log(10)) + 1 146 snprintf(buf, sizeof(buf), "%llu", t); 147 return std::string(buf); 148 } 149 #endif // defined(FLATBUFFERS_CPP98_STL) 150 151 // Special versions for floats/doubles. 152 template<typename T> std::string FloatToString(T t, int precision) { 153 // clang-format off 154 155 #ifndef FLATBUFFERS_PREFER_PRINTF 156 // to_string() prints different numbers of digits for floats depending on 157 // platform and isn't available on Android, so we use stringstream 158 std::stringstream ss; 159 // Use std::fixed to suppress scientific notation. 160 ss << std::fixed; 161 // Default precision is 6, we want that to be higher for doubles. 162 ss << std::setprecision(precision); 163 ss << t; 164 auto s = ss.str(); 165 #else // FLATBUFFERS_PREFER_PRINTF 166 auto v = static_cast<double>(t); 167 auto s = NumToStringImplWrapper(v, "%0.*f", precision); 168 #endif // FLATBUFFERS_PREFER_PRINTF 169 // clang-format on 170 // Sadly, std::fixed turns "1" into "1.00000", so here we undo that. 171 auto p = s.find_last_not_of('0'); 172 if (p != std::string::npos) { 173 // Strip trailing zeroes. If it is a whole number, keep one zero. 174 s.resize(p + (s[p] == '.' ? 2 : 1)); 175 } 176 return s; 177 } 178 179 template<> inline std::string NumToString<double>(double t) { 180 return FloatToString(t, 12); 181 } 182 template<> inline std::string NumToString<float>(float t) { 183 return FloatToString(t, 6); 184 } 185 186 // Convert an integer value to a hexadecimal string. 187 // The returned string length is always xdigits long, prefixed by 0 digits. 188 // For example, IntToStringHex(0x23, 8) returns the string "00000023". 189 inline std::string IntToStringHex(int i, int xdigits) { 190 FLATBUFFERS_ASSERT(i >= 0); 191 // clang-format off 192 193 #ifndef FLATBUFFERS_PREFER_PRINTF 194 std::stringstream ss; 195 ss << std::setw(xdigits) << std::setfill('0') << std::hex << std::uppercase 196 << i; 197 return ss.str(); 198 #else // FLATBUFFERS_PREFER_PRINTF 199 return NumToStringImplWrapper(i, "%.*X", xdigits); 200 #endif // FLATBUFFERS_PREFER_PRINTF 201 // clang-format on 202 } 203 204 // clang-format off 205 // Use locale independent functions {strtod_l, strtof_l, strtoll_l, strtoull_l}. 206 #if defined(FLATBUFFERS_LOCALE_INDEPENDENT) && (FLATBUFFERS_LOCALE_INDEPENDENT > 0) 207 class ClassicLocale { 208 #ifdef _MSC_VER 209 typedef _locale_t locale_type; 210 #else 211 typedef locale_t locale_type; // POSIX.1-2008 locale_t type 212 #endif 213 ClassicLocale(); 214 ~ClassicLocale(); 215 locale_type locale_; 216 static ClassicLocale instance_; 217 public: 218 static locale_type Get() { return instance_.locale_; } 219 }; 220 221 #ifdef _MSC_VER 222 #define __strtoull_impl(s, pe, b) _strtoui64_l(s, pe, b, ClassicLocale::Get()) 223 #define __strtoll_impl(s, pe, b) _strtoi64_l(s, pe, b, ClassicLocale::Get()) 224 #define __strtod_impl(s, pe) _strtod_l(s, pe, ClassicLocale::Get()) 225 #define __strtof_impl(s, pe) _strtof_l(s, pe, ClassicLocale::Get()) 226 #else 227 #define __strtoull_impl(s, pe, b) strtoull_l(s, pe, b, ClassicLocale::Get()) 228 #define __strtoll_impl(s, pe, b) strtoll_l(s, pe, b, ClassicLocale::Get()) 229 #define __strtod_impl(s, pe) strtod_l(s, pe, ClassicLocale::Get()) 230 #define __strtof_impl(s, pe) strtof_l(s, pe, ClassicLocale::Get()) 231 #endif 232 #else 233 #define __strtod_impl(s, pe) strtod(s, pe) 234 #define __strtof_impl(s, pe) static_cast<float>(strtod(s, pe)) 235 #ifdef _MSC_VER 236 #define __strtoull_impl(s, pe, b) _strtoui64(s, pe, b) 237 #define __strtoll_impl(s, pe, b) _strtoi64(s, pe, b) 238 #else 239 #define __strtoull_impl(s, pe, b) strtoull(s, pe, b) 240 #define __strtoll_impl(s, pe, b) strtoll(s, pe, b) 241 #endif 242 #endif 243 244 inline void strtoval_impl(int64_t *val, const char *str, char **endptr, 245 int base) { 246 *val = __strtoll_impl(str, endptr, base); 247 } 248 249 inline void strtoval_impl(uint64_t *val, const char *str, char **endptr, 250 int base) { 251 *val = __strtoull_impl(str, endptr, base); 252 } 253 254 inline void strtoval_impl(double *val, const char *str, char **endptr) { 255 *val = __strtod_impl(str, endptr); 256 } 257 258 // UBSAN: double to float is safe if numeric_limits<float>::is_iec559 is true. 259 __supress_ubsan__("float-cast-overflow") 260 inline void strtoval_impl(float *val, const char *str, char **endptr) { 261 *val = __strtof_impl(str, endptr); 262 } 263 #undef __strtoull_impl 264 #undef __strtoll_impl 265 #undef __strtod_impl 266 #undef __strtof_impl 267 // clang-format on 268 269 // Adaptor for strtoull()/strtoll(). 270 // Flatbuffers accepts numbers with any count of leading zeros (-009 is -9), 271 // while strtoll with base=0 interprets first leading zero as octal prefix. 272 // In future, it is possible to add prefixed 0b0101. 273 // 1) Checks errno code for overflow condition (out of range). 274 // 2) If base <= 0, function try to detect base of number by prefix. 275 // 276 // Return value (like strtoull and strtoll, but reject partial result): 277 // - If successful, an integer value corresponding to the str is returned. 278 // - If full string conversion can't be performed, 0 is returned. 279 // - If the converted value falls out of range of corresponding return type, a 280 // range error occurs. In this case value MAX(T)/MIN(T) is returned. 281 template<typename T> 282 inline bool StringToIntegerImpl(T *val, const char *const str, 283 const int base = 0, 284 const bool check_errno = true) { 285 // T is int64_t or uint64_T 286 FLATBUFFERS_ASSERT(str); 287 if (base <= 0) { 288 auto s = str; 289 while (*s && !is_digit(*s)) s++; 290 if (s[0] == '0' && is_alpha_char(s[1], 'X')) 291 return StringToIntegerImpl(val, str, 16, check_errno); 292 // if a prefix not match, try base=10 293 return StringToIntegerImpl(val, str, 10, check_errno); 294 } else { 295 if (check_errno) errno = 0; // clear thread-local errno 296 auto endptr = str; 297 strtoval_impl(val, str, const_cast<char **>(&endptr), base); 298 if ((*endptr != '\0') || (endptr == str)) { 299 *val = 0; // erase partial result 300 return false; // invalid string 301 } 302 // errno is out-of-range, return MAX/MIN 303 if (check_errno && errno) return false; 304 return true; 305 } 306 } 307 308 template<typename T> 309 inline bool StringToFloatImpl(T *val, const char *const str) { 310 // Type T must be either float or double. 311 FLATBUFFERS_ASSERT(str && val); 312 auto end = str; 313 strtoval_impl(val, str, const_cast<char **>(&end)); 314 auto done = (end != str) && (*end == '\0'); 315 if (!done) *val = 0; // erase partial result 316 return done; 317 } 318 319 // Convert a string to an instance of T. 320 // Return value (matched with StringToInteger64Impl and strtod): 321 // - If successful, a numeric value corresponding to the str is returned. 322 // - If full string conversion can't be performed, 0 is returned. 323 // - If the converted value falls out of range of corresponding return type, a 324 // range error occurs. In this case value MAX(T)/MIN(T) is returned. 325 template<typename T> inline bool StringToNumber(const char *s, T *val) { 326 FLATBUFFERS_ASSERT(s && val); 327 int64_t i64; 328 // The errno check isn't needed, will return MAX/MIN on overflow. 329 if (StringToIntegerImpl(&i64, s, 0, false)) { 330 const int64_t max = flatbuffers::numeric_limits<T>::max(); 331 const int64_t min = flatbuffers::numeric_limits<T>::lowest(); 332 if (i64 > max) { 333 *val = static_cast<T>(max); 334 return false; 335 } 336 if (i64 < min) { 337 // For unsigned types return max to distinguish from 338 // "no conversion can be performed" when 0 is returned. 339 *val = static_cast<T>(flatbuffers::is_unsigned<T>::value ? max : min); 340 return false; 341 } 342 *val = static_cast<T>(i64); 343 return true; 344 } 345 *val = 0; 346 return false; 347 } 348 349 template<> inline bool StringToNumber<int64_t>(const char *str, int64_t *val) { 350 return StringToIntegerImpl(val, str); 351 } 352 353 template<> 354 inline bool StringToNumber<uint64_t>(const char *str, uint64_t *val) { 355 if (!StringToIntegerImpl(val, str)) return false; 356 // The strtoull accepts negative numbers: 357 // If the minus sign was part of the input sequence, the numeric value 358 // calculated from the sequence of digits is negated as if by unary minus 359 // in the result type, which applies unsigned integer wraparound rules. 360 // Fix this behaviour (except -0). 361 if (*val) { 362 auto s = str; 363 while (*s && !is_digit(*s)) s++; 364 s = (s > str) ? (s - 1) : s; // step back to one symbol 365 if (*s == '-') { 366 // For unsigned types return the max to distinguish from 367 // "no conversion can be performed". 368 *val = flatbuffers::numeric_limits<uint64_t>::max(); 369 return false; 370 } 371 } 372 return true; 373 } 374 375 template<> inline bool StringToNumber(const char *s, float *val) { 376 return StringToFloatImpl(val, s); 377 } 378 379 template<> inline bool StringToNumber(const char *s, double *val) { 380 return StringToFloatImpl(val, s); 381 } 382 383 inline int64_t StringToInt(const char *s, int base = 10) { 384 int64_t val; 385 return StringToIntegerImpl(&val, s, base) ? val : 0; 386 } 387 388 inline uint64_t StringToUInt(const char *s, int base = 10) { 389 uint64_t val; 390 return StringToIntegerImpl(&val, s, base) ? val : 0; 391 } 392 393 typedef bool (*LoadFileFunction)(const char *filename, bool binary, 394 std::string *dest); 395 typedef bool (*FileExistsFunction)(const char *filename); 396 397 LoadFileFunction SetLoadFileFunction(LoadFileFunction load_file_function); 398 399 FileExistsFunction SetFileExistsFunction( 400 FileExistsFunction file_exists_function); 401 402 // Check if file "name" exists. 403 bool FileExists(const char *name); 404 405 // Check if "name" exists and it is also a directory. 406 bool DirExists(const char *name); 407 408 // Load file "name" into "buf" returning true if successful 409 // false otherwise. If "binary" is false data is read 410 // using ifstream's text mode, otherwise data is read with 411 // no transcoding. 412 bool LoadFile(const char *name, bool binary, std::string *buf); 413 414 // Save data "buf" of length "len" bytes into a file 415 // "name" returning true if successful, false otherwise. 416 // If "binary" is false data is written using ifstream's 417 // text mode, otherwise data is written with no 418 // transcoding. 419 bool SaveFile(const char *name, const char *buf, size_t len, bool binary); 420 421 // Save data "buf" into file "name" returning true if 422 // successful, false otherwise. If "binary" is false 423 // data is written using ifstream's text mode, otherwise 424 // data is written with no transcoding. 425 inline bool SaveFile(const char *name, const std::string &buf, bool binary) { 426 return SaveFile(name, buf.c_str(), buf.size(), binary); 427 } 428 429 // Functionality for minimalistic portable path handling. 430 431 // The functions below behave correctly regardless of whether posix ('/') or 432 // Windows ('/' or '\\') separators are used. 433 434 // Any new separators inserted are always posix. 435 FLATBUFFERS_CONSTEXPR char kPathSeparator = '/'; 436 437 // Returns the path with the extension, if any, removed. 438 std::string StripExtension(const std::string &filepath); 439 440 // Returns the extension, if any. 441 std::string GetExtension(const std::string &filepath); 442 443 // Return the last component of the path, after the last separator. 444 std::string StripPath(const std::string &filepath); 445 446 // Strip the last component of the path + separator. 447 std::string StripFileName(const std::string &filepath); 448 449 // Concatenates a path with a filename, regardless of wether the path 450 // ends in a separator or not. 451 std::string ConCatPathFileName(const std::string &path, 452 const std::string &filename); 453 454 // Replaces any '\\' separators with '/' 455 std::string PosixPath(const char *path); 456 457 // This function ensure a directory exists, by recursively 458 // creating dirs for any parts of the path that don't exist yet. 459 void EnsureDirExists(const std::string &filepath); 460 461 // Obtains the absolute path from any other path. 462 // Returns the input path if the absolute path couldn't be resolved. 463 std::string AbsolutePath(const std::string &filepath); 464 465 // To and from UTF-8 unicode conversion functions 466 467 // Convert a unicode code point into a UTF-8 representation by appending it 468 // to a string. Returns the number of bytes generated. 469 inline int ToUTF8(uint32_t ucc, std::string *out) { 470 FLATBUFFERS_ASSERT(!(ucc & 0x80000000)); // Top bit can't be set. 471 // 6 possible encodings: http://en.wikipedia.org/wiki/UTF-8 472 for (int i = 0; i < 6; i++) { 473 // Max bits this encoding can represent. 474 uint32_t max_bits = 6 + i * 5 + static_cast<int>(!i); 475 if (ucc < (1u << max_bits)) { // does it fit? 476 // Remaining bits not encoded in the first byte, store 6 bits each 477 uint32_t remain_bits = i * 6; 478 // Store first byte: 479 (*out) += static_cast<char>((0xFE << (max_bits - remain_bits)) | 480 (ucc >> remain_bits)); 481 // Store remaining bytes: 482 for (int j = i - 1; j >= 0; j--) { 483 (*out) += static_cast<char>(((ucc >> (j * 6)) & 0x3F) | 0x80); 484 } 485 return i + 1; // Return the number of bytes added. 486 } 487 } 488 FLATBUFFERS_ASSERT(0); // Impossible to arrive here. 489 return -1; 490 } 491 492 // Converts whatever prefix of the incoming string corresponds to a valid 493 // UTF-8 sequence into a unicode code. The incoming pointer will have been 494 // advanced past all bytes parsed. 495 // returns -1 upon corrupt UTF-8 encoding (ignore the incoming pointer in 496 // this case). 497 inline int FromUTF8(const char **in) { 498 int len = 0; 499 // Count leading 1 bits. 500 for (int mask = 0x80; mask >= 0x04; mask >>= 1) { 501 if (**in & mask) { 502 len++; 503 } else { 504 break; 505 } 506 } 507 if ((static_cast<unsigned char>(**in) << len) & 0x80) 508 return -1; // Bit after leading 1's must be 0. 509 if (!len) return *(*in)++; 510 // UTF-8 encoded values with a length are between 2 and 4 bytes. 511 if (len < 2 || len > 4) { return -1; } 512 // Grab initial bits of the code. 513 int ucc = *(*in)++ & ((1 << (7 - len)) - 1); 514 for (int i = 0; i < len - 1; i++) { 515 if ((**in & 0xC0) != 0x80) return -1; // Upper bits must 1 0. 516 ucc <<= 6; 517 ucc |= *(*in)++ & 0x3F; // Grab 6 more bits of the code. 518 } 519 // UTF-8 cannot encode values between 0xD800 and 0xDFFF (reserved for 520 // UTF-16 surrogate pairs). 521 if (ucc >= 0xD800 && ucc <= 0xDFFF) { return -1; } 522 // UTF-8 must represent code points in their shortest possible encoding. 523 switch (len) { 524 case 2: 525 // Two bytes of UTF-8 can represent code points from U+0080 to U+07FF. 526 if (ucc < 0x0080 || ucc > 0x07FF) { return -1; } 527 break; 528 case 3: 529 // Three bytes of UTF-8 can represent code points from U+0800 to U+FFFF. 530 if (ucc < 0x0800 || ucc > 0xFFFF) { return -1; } 531 break; 532 case 4: 533 // Four bytes of UTF-8 can represent code points from U+10000 to U+10FFFF. 534 if (ucc < 0x10000 || ucc > 0x10FFFF) { return -1; } 535 break; 536 } 537 return ucc; 538 } 539 540 #ifndef FLATBUFFERS_PREFER_PRINTF 541 // Wraps a string to a maximum length, inserting new lines where necessary. Any 542 // existing whitespace will be collapsed down to a single space. A prefix or 543 // suffix can be provided, which will be inserted before or after a wrapped 544 // line, respectively. 545 inline std::string WordWrap(const std::string in, size_t max_length, 546 const std::string wrapped_line_prefix, 547 const std::string wrapped_line_suffix) { 548 std::istringstream in_stream(in); 549 std::string wrapped, line, word; 550 551 in_stream >> word; 552 line = word; 553 554 while (in_stream >> word) { 555 if ((line.length() + 1 + word.length() + wrapped_line_suffix.length()) < 556 max_length) { 557 line += " " + word; 558 } else { 559 wrapped += line + wrapped_line_suffix + "\n"; 560 line = wrapped_line_prefix + word; 561 } 562 } 563 wrapped += line; 564 565 return wrapped; 566 } 567 #endif // !FLATBUFFERS_PREFER_PRINTF 568 569 inline bool EscapeString(const char *s, size_t length, std::string *_text, 570 bool allow_non_utf8, bool natural_utf8) { 571 std::string &text = *_text; 572 text += "\""; 573 for (uoffset_t i = 0; i < length; i++) { 574 char c = s[i]; 575 switch (c) { 576 case '\n': text += "\\n"; break; 577 case '\t': text += "\\t"; break; 578 case '\r': text += "\\r"; break; 579 case '\b': text += "\\b"; break; 580 case '\f': text += "\\f"; break; 581 case '\"': text += "\\\""; break; 582 case '\\': text += "\\\\"; break; 583 default: 584 if (c >= ' ' && c <= '~') { 585 text += c; 586 } else { 587 // Not printable ASCII data. Let's see if it's valid UTF-8 first: 588 const char *utf8 = s + i; 589 int ucc = FromUTF8(&utf8); 590 if (ucc < 0) { 591 if (allow_non_utf8) { 592 text += "\\x"; 593 text += IntToStringHex(static_cast<uint8_t>(c), 2); 594 } else { 595 // There are two cases here: 596 // 597 // 1) We reached here by parsing an IDL file. In that case, 598 // we previously checked for non-UTF-8, so we shouldn't reach 599 // here. 600 // 601 // 2) We reached here by someone calling GenerateText() 602 // on a previously-serialized flatbuffer. The data might have 603 // non-UTF-8 Strings, or might be corrupt. 604 // 605 // In both cases, we have to give up and inform the caller 606 // they have no JSON. 607 return false; 608 } 609 } else { 610 if (natural_utf8) { 611 // utf8 points to past all utf-8 bytes parsed 612 text.append(s + i, static_cast<size_t>(utf8 - s - i)); 613 } else if (ucc <= 0xFFFF) { 614 // Parses as Unicode within JSON's \uXXXX range, so use that. 615 text += "\\u"; 616 text += IntToStringHex(ucc, 4); 617 } else if (ucc <= 0x10FFFF) { 618 // Encode Unicode SMP values to a surrogate pair using two \u 619 // escapes. 620 uint32_t base = ucc - 0x10000; 621 auto high_surrogate = (base >> 10) + 0xD800; 622 auto low_surrogate = (base & 0x03FF) + 0xDC00; 623 text += "\\u"; 624 text += IntToStringHex(high_surrogate, 4); 625 text += "\\u"; 626 text += IntToStringHex(low_surrogate, 4); 627 } 628 // Skip past characters recognized. 629 i = static_cast<uoffset_t>(utf8 - s - 1); 630 } 631 } 632 break; 633 } 634 } 635 text += "\""; 636 return true; 637 } 638 639 // Remove paired quotes in a string: "text"|'text' -> text. 640 std::string RemoveStringQuotes(const std::string &s); 641 642 // Change th global C-locale to locale with name <locale_name>. 643 // Returns an actual locale name in <_value>, useful if locale_name is "" or 644 // null. 645 bool SetGlobalTestLocale(const char *locale_name, 646 std::string *_value = nullptr); 647 648 // Read (or test) a value of environment variable. 649 bool ReadEnvironmentVariable(const char *var_name, 650 std::string *_value = nullptr); 651 652 } // namespace flatbuffers 653 654 #endif // FLATBUFFERS_UTIL_H_ 655