/* * libjingle * Copyright 2004--2005, Google Inc. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, * this list of conditions and the following disclaimer. * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * 3. The name of the author may not be used to endorse or promote products * derived from this software without specific prior written permission. * * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #ifndef TALK_BASE_STRINGUTILS_H__ #define TALK_BASE_STRINGUTILS_H__ #include <ctype.h> #include <stdarg.h> #include <stdio.h> #ifdef WIN32 #include <malloc.h> #include <wchar.h> #define alloca _alloca #endif // WIN32 #ifdef POSIX #ifdef BSD #include <stdlib.h> #else // BSD #include <alloca.h> #endif // !BSD #endif // POSIX #include <cstring> #include <string> #include "talk/base/basictypes.h" /////////////////////////////////////////////////////////////////////////////// // Generic string/memory utilities /////////////////////////////////////////////////////////////////////////////// #define STACK_ARRAY(TYPE, LEN) static_cast<TYPE*>(::alloca((LEN)*sizeof(TYPE))) namespace talk_base { // Complement to memset. Verifies memory consists of count bytes of value c. bool memory_check(const void* memory, int c, size_t count); // Determines whether the simple wildcard pattern matches target. // Alpha characters in pattern match case-insensitively. // Asterisks in pattern match 0 or more characters. // Ex: string_match("www.TEST.GOOGLE.COM", "www.*.com") -> true bool string_match(const char* target, const char* pattern); } // namespace talk_base /////////////////////////////////////////////////////////////////////////////// // Rename a bunch of common string functions so they are consistent across // platforms and between char and wchar_t variants. // Here is the full list of functions that are unified: // strlen, strcmp, stricmp, strncmp, strnicmp // strchr, vsnprintf, strtoul, tolowercase // tolowercase is like tolower, but not compatible with end-of-file value // // It's not clear if we will ever use wchar_t strings on unix. In theory, // all strings should be Utf8 all the time, except when interfacing with Win32 // APIs that require Utf16. /////////////////////////////////////////////////////////////////////////////// inline char tolowercase(char c) { return static_cast<char>(tolower(c)); } #ifdef WIN32 inline size_t strlen(const wchar_t* s) { return wcslen(s); } inline int strcmp(const wchar_t* s1, const wchar_t* s2) { return wcscmp(s1, s2); } inline int stricmp(const wchar_t* s1, const wchar_t* s2) { return _wcsicmp(s1, s2); } inline int strncmp(const wchar_t* s1, const wchar_t* s2, size_t n) { return wcsncmp(s1, s2, n); } inline int strnicmp(const wchar_t* s1, const wchar_t* s2, size_t n) { return _wcsnicmp(s1, s2, n); } inline const wchar_t* strchr(const wchar_t* s, wchar_t c) { return wcschr(s, c); } inline const wchar_t* strstr(const wchar_t* haystack, const wchar_t* needle) { return wcsstr(haystack, needle); } #ifndef vsnprintf inline int vsnprintf(char* buf, size_t n, const char* fmt, va_list args) { return _vsnprintf(buf, n, fmt, args); } inline int vsnprintf(wchar_t* buf, size_t n, const wchar_t* fmt, va_list args) { return _vsnwprintf(buf, n, fmt, args); } #endif // !vsnprintf inline unsigned long strtoul(const wchar_t* snum, wchar_t** end, int base) { return wcstoul(snum, end, base); } inline wchar_t tolowercase(wchar_t c) { return static_cast<wchar_t>(towlower(c)); } #endif // WIN32 #ifdef POSIX inline int _stricmp(const char* s1, const char* s2) { return strcasecmp(s1, s2); } inline int _strnicmp(const char* s1, const char* s2, size_t n) { return strncasecmp(s1, s2, n); } #endif // POSIX /////////////////////////////////////////////////////////////////////////////// // Traits simplifies porting string functions to be CTYPE-agnostic /////////////////////////////////////////////////////////////////////////////// namespace talk_base { const size_t SIZE_UNKNOWN = static_cast<size_t>(-1); template<class CTYPE> struct Traits { // STL string type //typedef XXX string; // Null-terminated string //inline static const CTYPE* empty_str(); }; /////////////////////////////////////////////////////////////////////////////// // String utilities which work with char or wchar_t /////////////////////////////////////////////////////////////////////////////// template<class CTYPE> inline const CTYPE* nonnull(const CTYPE* str, const CTYPE* def_str = NULL) { return str ? str : (def_str ? def_str : Traits<CTYPE>::empty_str()); } template<class CTYPE> const CTYPE* strchr(const CTYPE* str, const CTYPE* chs) { for (size_t i=0; str[i]; ++i) { for (size_t j=0; chs[j]; ++j) { if (str[i] == chs[j]) { return str + i; } } } return 0; } template<class CTYPE> const CTYPE* strchrn(const CTYPE* str, size_t slen, CTYPE ch) { for (size_t i=0; i<slen && str[i]; ++i) { if (str[i] == ch) { return str + i; } } return 0; } template<class CTYPE> size_t strlenn(const CTYPE* buffer, size_t buflen) { size_t bufpos = 0; while (buffer[bufpos] && (bufpos < buflen)) { ++bufpos; } return bufpos; } // Safe versions of strncpy, strncat, snprintf and vsnprintf that always // null-terminate. template<class CTYPE> size_t strcpyn(CTYPE* buffer, size_t buflen, const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { if (buflen <= 0) return 0; if (srclen == SIZE_UNKNOWN) { srclen = strlenn(source, buflen - 1); } else if (srclen >= buflen) { srclen = buflen - 1; } memcpy(buffer, source, srclen * sizeof(CTYPE)); buffer[srclen] = 0; return srclen; } template<class CTYPE> size_t strcatn(CTYPE* buffer, size_t buflen, const CTYPE* source, size_t srclen = SIZE_UNKNOWN) { if (buflen <= 0) return 0; size_t bufpos = strlenn(buffer, buflen - 1); return bufpos + strcpyn(buffer + bufpos, buflen - bufpos, source, srclen); } // Some compilers (clang specifically) require vsprintfn be defined before // sprintfn. template<class CTYPE> size_t vsprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, va_list args) { int len = vsnprintf(buffer, buflen, format, args); if ((len < 0) || (static_cast<size_t>(len) >= buflen)) { len = static_cast<int>(buflen - 1); buffer[len] = 0; } return len; } template<class CTYPE> size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...); /* This works to get GCC to notice printf argument mismatches, but then complains of missing implementation of sprintfn<char> template<> size_t sprintfn(char* buffer, size_t buflen, const char* format, ...) GCC_ATTR(format(printf,3,4)); */ template<class CTYPE> size_t sprintfn(CTYPE* buffer, size_t buflen, const CTYPE* format, ...) { va_list args; va_start(args, format); size_t len = vsprintfn(buffer, buflen, format, args); va_end(args); return len; } /////////////////////////////////////////////////////////////////////////////// // Allow safe comparing and copying ascii (not UTF-8) with both wide and // non-wide character strings. /////////////////////////////////////////////////////////////////////////////// inline int asccmp(const char* s1, const char* s2) { return strcmp(s1, s2); } inline int ascicmp(const char* s1, const char* s2) { return _stricmp(s1, s2); } inline int ascncmp(const char* s1, const char* s2, size_t n) { return strncmp(s1, s2, n); } inline int ascnicmp(const char* s1, const char* s2, size_t n) { return _strnicmp(s1, s2, n); } inline size_t asccpyn(char* buffer, size_t buflen, const char* source, size_t srclen = SIZE_UNKNOWN) { return strcpyn(buffer, buflen, source, srclen); } #ifdef WIN32 typedef wchar_t(*CharacterTransformation)(wchar_t); inline wchar_t identity(wchar_t c) { return c; } int ascii_string_compare(const wchar_t* s1, const char* s2, size_t n, CharacterTransformation transformation); inline int asccmp(const wchar_t* s1, const char* s2) { return ascii_string_compare(s1, s2, static_cast<size_t>(-1), identity); } inline int ascicmp(const wchar_t* s1, const char* s2) { return ascii_string_compare(s1, s2, static_cast<size_t>(-1), tolowercase); } inline int ascncmp(const wchar_t* s1, const char* s2, size_t n) { return ascii_string_compare(s1, s2, n, identity); } inline int ascnicmp(const wchar_t* s1, const char* s2, size_t n) { return ascii_string_compare(s1, s2, n, tolowercase); } size_t asccpyn(wchar_t* buffer, size_t buflen, const char* source, size_t srclen = SIZE_UNKNOWN); #endif // WIN32 /////////////////////////////////////////////////////////////////////////////// // Traits<char> specializations /////////////////////////////////////////////////////////////////////////////// template<> struct Traits<char> { typedef std::string string; inline static const char* empty_str() { return ""; } }; /////////////////////////////////////////////////////////////////////////////// // Traits<wchar_t> specializations (Windows only, currently) /////////////////////////////////////////////////////////////////////////////// #ifdef WIN32 template<> struct Traits<wchar_t> { typedef std::wstring string; inline static const wchar_t* Traits<wchar_t>::empty_str() { return L""; } }; #endif // WIN32 // Replaces all occurrences of "search" with "replace". void replace_substrs(const char *search, size_t search_len, const char *replace, size_t replace_len, std::string *s); // True iff s1 starts with s2. bool starts_with(const char *s1, const char *s2); // Remove leading and trailing whitespaces. std::string string_trim(const std::string& s); } // namespace talk_base #endif // TALK_BASE_STRINGUTILS_H__