/*
 * libjingle
 * Copyright 2004--2005, Google Inc.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are met:
 *
 *  1. Redistributions of source code must retain the above copyright notice,
 *     this list of conditions and the following disclaimer.
 *  2. Redistributions in binary form must reproduce the above copyright notice,
 *     this list of conditions and the following disclaimer in the documentation
 *     and/or other materials provided with the distribution.
 *  3. The name of the author may not be used to endorse or promote products
 *     derived from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
 * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#ifndef TALK_BASE_STRINGUTILS_H__
#define TALK_BASE_STRINGUTILS_H__

#include <ctype.h>
#include <stdarg.h>
#include <stdio.h>

// alloca lives in a different header on each platform; on Windows it is
// spelled _alloca, so it is aliased to the common name here.
#ifdef WIN32
#include <malloc.h>
#include <wchar.h>
#define alloca _alloca
#endif  // WIN32

#ifdef POSIX
#ifdef BSD
#include <stdlib.h>
#else  // BSD
#include <alloca.h>
#endif  // !BSD
#endif  // POSIX

#include <cstring>
#include <string>

#include "talk/base/basictypes.h"

///////////////////////////////////////////////////////////////////////////////
// Generic string/memory utilities
///////////////////////////////////////////////////////////////////////////////

// Yields a TYPE* to uninitialized storage for LEN elements of TYPE, obtained
// from alloca. The result must not be freed by the caller.
// NOTE(review): alloca storage normally lives only until the calling function
// returns, and LEN * sizeof(TYPE) is not checked for overflow -- confirm that
// callers only pass small, trusted lengths.
#define STACK_ARRAY(TYPE, LEN) static_cast<TYPE*>(::alloca((LEN)*sizeof(TYPE)))

namespace talk_base {

// Complement to memset.  Verifies memory consists of count bytes of value c.
// (Declaration only; the implementation is not part of this header.)
bool memory_check(const void* memory, int c, size_t count);

// Determines whether the simple wildcard pattern matches target.
// Alpha characters in pattern match case-insensitively.
// Asterisks in pattern match 0 or more characters.
// Ex: string_match("www.TEST.GOOGLE.COM", "www.*.com") -> true
// (Declaration only; the implementation is not part of this header.)
bool string_match(const char* target, const char* pattern);

}  // namespace talk_base

///////////////////////////////////////////////////////////////////////////////
// Rename a bunch of common string functions so they are consistent across
// platforms and between char and wchar_t variants.
// Here is the full list of functions that are unified:
//  strlen, strcmp, stricmp, strncmp, strnicmp
//  strchr, vsnprintf, strtoul, tolowercase
// tolowercase is like tolower, but not compatible with end-of-file value
//
// It's not clear if we will ever use wchar_t strings on unix.  In theory,
// all strings should be Utf8 all the time, except when interfacing with Win32
// APIs that require Utf16.
84 /////////////////////////////////////////////////////////////////////////////// 85 86 inline char tolowercase(char c) { 87 return static_cast<char>(tolower(c)); 88 } 89 90 #ifdef WIN32 91 92 inline size_t strlen(const wchar_t* s) { 93 return wcslen(s); 94 } 95 inline int strcmp(const wchar_t* s1, const wchar_t* s2) { 96 return wcscmp(s1, s2); 97 } 98 inline int stricmp(const wchar_t* s1, const wchar_t* s2) { 99 return _wcsicmp(s1, s2); 100 } 101 inline int strncmp(const wchar_t* s1, const wchar_t* s2, size_t n) { 102 return wcsncmp(s1, s2, n); 103 } 104 inline int strnicmp(const wchar_t* s1, const wchar_t* s2, size_t n) { 105 return _wcsnicmp(s1, s2, n); 106 } 107 inline const wchar_t* strchr(const wchar_t* s, wchar_t c) { 108 return wcschr(s, c); 109 } 110 inline const wchar_t* strstr(const wchar_t* haystack, const wchar_t* needle) { 111 return wcsstr(haystack, needle); 112 } 113 #ifndef vsnprintf 114 inline int vsnprintf(wchar_t* buf, size_t n, const wchar_t* fmt, va_list args) { 115 return _vsnwprintf(buf, n, fmt, args); 116 } 117 #endif // !vsnprintf 118 inline unsigned long strtoul(const wchar_t* snum, wchar_t** end, int base) { 119 return wcstoul(snum, end, base); 120 } 121 inline wchar_t tolowercase(wchar_t c) { 122 return static_cast<wchar_t>(towlower(c)); 123 } 124 125 #endif // WIN32 126 127 #ifdef POSIX 128 129 inline int _stricmp(const char* s1, const char* s2) { 130 return strcasecmp(s1, s2); 131 } 132 inline int _strnicmp(const char* s1, const char* s2, size_t n) { 133 return strncasecmp(s1, s2, n); 134 } 135 136 #endif // POSIX 137 138 /////////////////////////////////////////////////////////////////////////////// 139 // Traits simplifies porting string functions to be CTYPE-agnostic 140 /////////////////////////////////////////////////////////////////////////////// 141 142 namespace talk_base { 143 144 const size_t SIZE_UNKNOWN = static_cast<size_t>(-1); 145 146 template<class CTYPE> 147 struct Traits { 148 // STL string type 149 //typedef XXX 
string; 150 // Null-terminated string 151 //inline static const CTYPE* empty_str(); 152 }; 153 154 /////////////////////////////////////////////////////////////////////////////// 155 // String utilities which work with char or wchar_t 156 /////////////////////////////////////////////////////////////////////////////// 157 158 template<class CTYPE> 159 inline const CTYPE* nonnull(const CTYPE* str, const CTYPE* def_str = NULL) { 160 return str ? str : (def_str ? def_str : Traits<CTYPE>::empty_str()); 161 } 162 163 template<class CTYPE> 164 const CTYPE* strchr(const CTYPE* str, const CTYPE* chs) { 165 for (size_t i=0; str[i]; ++i) { 166 for (size_t j=0; chs[j]; ++j) { 167 if (str[i] == chs[j]) { 168 return str + i; 169 } 170 } 171 } 172 return 0; 173 } 174 175 template<class CTYPE> 176 const CTYPE* strchrn(const CTYPE* str, size_t slen, CTYPE ch) { 177 for (size_t i=0; i<slen && str[i]; ++i) { 178 if (str[i] == ch) { 179 return str + i; 180 } 181 } 182 return 0; 183 } 184 185 template<class CTYPE> 186 size_t strlenn(const CTYPE* buffer, size_t buflen) { 187 size_t bufpos = 0; 188 while (buffer[bufpos] && (bufpos < buflen)) { 189 ++bufpos; 190 } 191 return bufpos; 192 } 193 194 // Safe versions of strncpy, strncat, snprintf and vsnprintf that always 195 // null-terminate. 
196 197 template<class CTYPE> 198 size_t strcpyn(CTYPE* buffer, size_t buflen, 199 const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { 200 if (buflen <= 0) 201 return 0; 202 203 if (srclen == SIZE_UNKNOWN) { 204 srclen = strlenn(source, buflen - 1); 205 } else if (srclen >= buflen) { 206 srclen = buflen - 1; 207 } 208 memcpy(buffer, source, srclen * sizeof(CTYPE)); 209 buffer[srclen] = 0; 210 return srclen; 211 } 212 213 template<class CTYPE> 214 size_t strcatn(CTYPE* buffer, size_t buflen, 215 const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { 216 if (buflen <= 0) 217 return 0; 218 219 size_t bufpos = strlenn(buffer, buflen - 1); 220 return bufpos + strcpyn(buffer + bufpos, buflen - bufpos, source, srclen); 221 } 222 223 // Some compilers (clang specifically) require vsprintfn be defined before 224 // sprintfn. 225 template<class CTYPE> 226 size_t vsprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, 227 va_list args) { 228 int len = vsnprintf(buffer, buflen, format, args); 229 if ((len < 0) || (static_cast<size_t>(len) >= buflen)) { 230 len = static_cast<int>(buflen - 1); 231 buffer[len] = 0; 232 } 233 return len; 234 } 235 236 template<class CTYPE> 237 size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...); 238 template<class CTYPE> 239 size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...) { 240 va_list args; 241 va_start(args, format); 242 size_t len = vsprintfn(buffer, buflen, format, args); 243 va_end(args); 244 return len; 245 } 246 247 /////////////////////////////////////////////////////////////////////////////// 248 // Allow safe comparing and copying ascii (not UTF-8) with both wide and 249 // non-wide character strings. 
250 /////////////////////////////////////////////////////////////////////////////// 251 252 inline int asccmp(const char* s1, const char* s2) { 253 return strcmp(s1, s2); 254 } 255 inline int ascicmp(const char* s1, const char* s2) { 256 return _stricmp(s1, s2); 257 } 258 inline int ascncmp(const char* s1, const char* s2, size_t n) { 259 return strncmp(s1, s2, n); 260 } 261 inline int ascnicmp(const char* s1, const char* s2, size_t n) { 262 return _strnicmp(s1, s2, n); 263 } 264 inline size_t asccpyn(char* buffer, size_t buflen, 265 const char* source, size_t srclen = SIZE_UNKNOWN) { 266 return strcpyn(buffer, buflen, source, srclen); 267 } 268 269 #ifdef WIN32 270 271 typedef wchar_t(*CharacterTransformation)(wchar_t); 272 inline wchar_t identity(wchar_t c) { return c; } 273 int ascii_string_compare(const wchar_t* s1, const char* s2, size_t n, 274 CharacterTransformation transformation); 275 276 inline int asccmp(const wchar_t* s1, const char* s2) { 277 return ascii_string_compare(s1, s2, static_cast<size_t>(-1), identity); 278 } 279 inline int ascicmp(const wchar_t* s1, const char* s2) { 280 return ascii_string_compare(s1, s2, static_cast<size_t>(-1), tolowercase); 281 } 282 inline int ascncmp(const wchar_t* s1, const char* s2, size_t n) { 283 return ascii_string_compare(s1, s2, n, identity); 284 } 285 inline int ascnicmp(const wchar_t* s1, const char* s2, size_t n) { 286 return ascii_string_compare(s1, s2, n, tolowercase); 287 } 288 size_t asccpyn(wchar_t* buffer, size_t buflen, 289 const char* source, size_t srclen = SIZE_UNKNOWN); 290 291 #endif // WIN32 292 293 /////////////////////////////////////////////////////////////////////////////// 294 // Traits<char> specializations 295 /////////////////////////////////////////////////////////////////////////////// 296 297 template<> 298 struct Traits<char> { 299 typedef std::string string; 300 inline static const char* empty_str() { return ""; } 301 }; 302 303 
/////////////////////////////////////////////////////////////////////////////// 304 // Traits<wchar_t> specializations (Windows only, currently) 305 /////////////////////////////////////////////////////////////////////////////// 306 307 #ifdef WIN32 308 309 template<> 310 struct Traits<wchar_t> { 311 typedef std::wstring string; 312 inline static const wchar_t* Traits<wchar_t>::empty_str() { return L""; } 313 }; 314 315 #endif // WIN32 316 317 // Replaces all occurrences of "search" with "replace". 318 void replace_substrs(const char *search, 319 size_t search_len, 320 const char *replace, 321 size_t replace_len, 322 std::string *s); 323 324 // True iff s1 starts with s2. 325 bool starts_with(const char *s1, const char *s2); 326 327 // True iff s1 ends with s2. 328 bool ends_with(const char *s1, const char *s2); 329 330 // Remove leading and trailing whitespaces. 331 std::string string_trim(const std::string& s); 332 333 } // namespace talk_base 334 335 #endif // TALK_BASE_STRINGUTILS_H__ 336