| /* |
| * libjingle |
| * Copyright 2004--2005, Google Inc. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions are met: |
| * |
| * 1. Redistributions of source code must retain the above copyright notice, |
| * this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright notice, |
| * this list of conditions and the following disclaimer in the documentation |
| * and/or other materials provided with the distribution. |
| * 3. The name of the author may not be used to endorse or promote products |
| * derived from this software without specific prior written permission. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED |
| * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF |
| * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO |
| * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; |
| * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, |
| * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR |
| * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF |
| * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #ifndef TALK_BASE_STRINGUTILS_H__ |
| #define TALK_BASE_STRINGUTILS_H__ |
| |
| #include <ctype.h> |
| #include <stdarg.h> |
| #include <stdio.h> |
| #include <string.h> |
| |
| #ifdef WIN32 |
| #include <malloc.h> |
| #include <wchar.h> |
| #define alloca _alloca |
| #endif // WIN32 |
| |
| #ifdef POSIX |
| #ifdef BSD |
| #include <stdlib.h> |
| #else // BSD |
| #include <alloca.h> |
| #endif // !BSD |
| #endif // POSIX |
| |
| #include <string> |
| |
| #include "talk/base/basictypes.h" |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Generic string/memory utilities |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| #define STACK_ARRAY(TYPE, LEN) static_cast<TYPE*>(::alloca((LEN)*sizeof(TYPE))) |
| |
| namespace talk_base { |
| |
| // Complement to memset. Verifies memory consists of count bytes of value c. |
| bool memory_check(const void* memory, int c, size_t count); |
| |
| // Determines whether the simple wildcard pattern matches target. |
| // Alpha characters in pattern match case-insensitively. |
| // Asterisks in pattern match 0 or more characters. |
| // Ex: string_match("www.TEST.GOOGLE.COM", "www.*.com") -> true |
| bool string_match(const char* target, const char* pattern); |
| |
| } // namespace talk_base |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Rename a bunch of common string functions so they are consistent across |
| // platforms and between char and wchar_t variants. |
| // Here is the full list of functions that are unified: |
| // strlen, strcmp, stricmp, strncmp, strnicmp |
| // strchr, vsnprintf, strtoul, tolowercase |
| // tolowercase is like tolower, but not compatible with end-of-file value |
| // |
| // It's not clear if we will ever use wchar_t strings on unix. In theory, |
| // all strings should be Utf8 all the time, except when interfacing with Win32 |
| // APIs that require Utf16. |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| inline char tolowercase(char c) { |
| return static_cast<char>(tolower(c)); |
| } |
| |
| #ifdef WIN32 |
| |
| inline size_t strlen(const wchar_t* s) { |
| return wcslen(s); |
| } |
| inline int strcmp(const wchar_t* s1, const wchar_t* s2) { |
| return wcscmp(s1, s2); |
| } |
| inline int stricmp(const wchar_t* s1, const wchar_t* s2) { |
| return _wcsicmp(s1, s2); |
| } |
| inline int strncmp(const wchar_t* s1, const wchar_t* s2, size_t n) { |
| return wcsncmp(s1, s2, n); |
| } |
| inline int strnicmp(const wchar_t* s1, const wchar_t* s2, size_t n) { |
| return _wcsnicmp(s1, s2, n); |
| } |
| inline const wchar_t* strchr(const wchar_t* s, wchar_t c) { |
| return wcschr(s, c); |
| } |
| inline const wchar_t* strstr(const wchar_t* haystack, const wchar_t* needle) { |
| return wcsstr(haystack, needle); |
| } |
| #ifndef vsnprintf |
| inline int vsnprintf(wchar_t* buf, size_t n, const wchar_t* fmt, va_list args) { |
| return _vsnwprintf(buf, n, fmt, args); |
| } |
| #endif // !vsnprintf |
| inline unsigned long strtoul(const wchar_t* snum, wchar_t** end, int base) { |
| return wcstoul(snum, end, base); |
| } |
| inline wchar_t tolowercase(wchar_t c) { |
| return static_cast<wchar_t>(towlower(c)); |
| } |
| |
| #endif // WIN32 |
| |
| #ifdef POSIX |
| |
| inline int _stricmp(const char* s1, const char* s2) { |
| return strcasecmp(s1, s2); |
| } |
| inline int _strnicmp(const char* s1, const char* s2, size_t n) { |
| return strncasecmp(s1, s2, n); |
| } |
| |
| #endif // POSIX |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Traits simplifies porting string functions to be CTYPE-agnostic |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| namespace talk_base { |
| |
| const size_t SIZE_UNKNOWN = static_cast<size_t>(-1); |
| |
| template<class CTYPE> |
| struct Traits { |
| // STL string type |
| //typedef XXX string; |
| // Null-terminated string |
| //inline static const CTYPE* empty_str(); |
| }; |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // String utilities which work with char or wchar_t |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| template<class CTYPE> |
| inline const CTYPE* nonnull(const CTYPE* str, const CTYPE* def_str = NULL) { |
| return str ? str : (def_str ? def_str : Traits<CTYPE>::empty_str()); |
| } |
| |
| template<class CTYPE> |
| const CTYPE* strchr(const CTYPE* str, const CTYPE* chs) { |
| for (size_t i=0; str[i]; ++i) { |
| for (size_t j=0; chs[j]; ++j) { |
| if (str[i] == chs[j]) { |
| return str + i; |
| } |
| } |
| } |
| return 0; |
| } |
| |
| template<class CTYPE> |
| const CTYPE* strchrn(const CTYPE* str, size_t slen, CTYPE ch) { |
| for (size_t i=0; i<slen && str[i]; ++i) { |
| if (str[i] == ch) { |
| return str + i; |
| } |
| } |
| return 0; |
| } |
| |
| template<class CTYPE> |
| size_t strlenn(const CTYPE* buffer, size_t buflen) { |
| size_t bufpos = 0; |
| while (buffer[bufpos] && (bufpos < buflen)) { |
| ++bufpos; |
| } |
| return bufpos; |
| } |
| |
| // Safe versions of strncpy, strncat, snprintf and vsnprintf that always |
| // null-terminate. |
| |
| template<class CTYPE> |
| size_t strcpyn(CTYPE* buffer, size_t buflen, |
| const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { |
| if (buflen <= 0) |
| return 0; |
| |
| if (srclen == SIZE_UNKNOWN) { |
| srclen = strlenn(source, buflen - 1); |
| } else if (srclen >= buflen) { |
| srclen = buflen - 1; |
| } |
| memcpy(buffer, source, srclen * sizeof(CTYPE)); |
| buffer[srclen] = 0; |
| return srclen; |
| } |
| |
| template<class CTYPE> |
| size_t strcatn(CTYPE* buffer, size_t buflen, |
| const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { |
| if (buflen <= 0) |
| return 0; |
| |
| size_t bufpos = strlenn(buffer, buflen - 1); |
| return bufpos + strcpyn(buffer + bufpos, buflen - bufpos, source, srclen); |
| } |
| |
| // Some compilers (clang specifically) require vsprintfn be defined before |
| // sprintfn. |
| template<class CTYPE> |
| size_t vsprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, |
| va_list args) { |
| int len = vsnprintf(buffer, buflen, format, args); |
| if ((len < 0) || (static_cast<size_t>(len) >= buflen)) { |
| len = static_cast<int>(buflen - 1); |
| buffer[len] = 0; |
| } |
| return len; |
| } |
| |
| template<class CTYPE> |
| size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...); |
| template<class CTYPE> |
| size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...) { |
| va_list args; |
| va_start(args, format); |
| size_t len = vsprintfn(buffer, buflen, format, args); |
| va_end(args); |
| return len; |
| } |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Allow safe comparing and copying ascii (not UTF-8) with both wide and |
| // non-wide character strings. |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| inline int asccmp(const char* s1, const char* s2) { |
| return strcmp(s1, s2); |
| } |
| inline int ascicmp(const char* s1, const char* s2) { |
| return _stricmp(s1, s2); |
| } |
| inline int ascncmp(const char* s1, const char* s2, size_t n) { |
| return strncmp(s1, s2, n); |
| } |
| inline int ascnicmp(const char* s1, const char* s2, size_t n) { |
| return _strnicmp(s1, s2, n); |
| } |
| inline size_t asccpyn(char* buffer, size_t buflen, |
| const char* source, size_t srclen = SIZE_UNKNOWN) { |
| return strcpyn(buffer, buflen, source, srclen); |
| } |
| |
| #ifdef WIN32 |
| |
| typedef wchar_t(*CharacterTransformation)(wchar_t); |
| inline wchar_t identity(wchar_t c) { return c; } |
| int ascii_string_compare(const wchar_t* s1, const char* s2, size_t n, |
| CharacterTransformation transformation); |
| |
| inline int asccmp(const wchar_t* s1, const char* s2) { |
| return ascii_string_compare(s1, s2, static_cast<size_t>(-1), identity); |
| } |
| inline int ascicmp(const wchar_t* s1, const char* s2) { |
| return ascii_string_compare(s1, s2, static_cast<size_t>(-1), tolowercase); |
| } |
| inline int ascncmp(const wchar_t* s1, const char* s2, size_t n) { |
| return ascii_string_compare(s1, s2, n, identity); |
| } |
| inline int ascnicmp(const wchar_t* s1, const char* s2, size_t n) { |
| return ascii_string_compare(s1, s2, n, tolowercase); |
| } |
| size_t asccpyn(wchar_t* buffer, size_t buflen, |
| const char* source, size_t srclen = SIZE_UNKNOWN); |
| |
| #endif // WIN32 |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Traits<char> specializations |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| template<> |
| struct Traits<char> { |
| typedef std::string string; |
| inline static const char* empty_str() { return ""; } |
| }; |
| |
| /////////////////////////////////////////////////////////////////////////////// |
| // Traits<wchar_t> specializations (Windows only, currently) |
| /////////////////////////////////////////////////////////////////////////////// |
| |
| #ifdef WIN32 |
| |
| template<> |
| struct Traits<wchar_t> { |
| typedef std::wstring string; |
| inline static const wchar_t* Traits<wchar_t>::empty_str() { return L""; } |
| }; |
| |
| #endif // WIN32 |
| |
| // Replaces all occurrences of "search" with "replace". |
| void replace_substrs(const char *search, |
| size_t search_len, |
| const char *replace, |
| size_t replace_len, |
| std::string *s); |
| |
| // True iff s1 starts with s2. |
| bool starts_with(const char *s1, const char *s2); |
| |
| // True iff s1 ends with s2. |
| bool ends_with(const char *s1, const char *s2); |
| |
| // Remove leading and trailing whitespaces. |
| std::string string_trim(const std::string& s); |
| |
| } // namespace talk_base |
| |
| #endif // TALK_BASE_STRINGUTILS_H__ |