/* $Id: string.h 18589 2009-04-01 09:11:02Z vboxsync $ */ /** @file * MS COM / XPCOM Abstraction Layer: * Smart string classes declaration */ /* * Copyright (C) 2006-2009 Sun Microsystems, Inc. * * This file is part of VirtualBox Open Source Edition (OSE), as * available from http://www.virtualbox.org. This file is free software; * you can redistribute it and/or modify it under the terms of the GNU * General Public License (GPL) as published by the Free Software * Foundation, in version 2 as it comes in the "COPYING" file of the * VirtualBox OSE distribution. VirtualBox OSE is distributed in the * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind. * * The contents of this file may alternatively be used under the terms * of the Common Development and Distribution License Version 1.0 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the * VirtualBox OSE distribution, in which case the provisions of the * CDDL are applicable instead of those of the GPL. * * You may elect to license modified versions of this file under the * terms and conditions of either the GPL or the CDDL or both. * * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa * Clara, CA 95054 USA or visit http://www.sun.com if you need * additional information or have any questions. */ #ifndef ___VBox_com_string_h #define ___VBox_com_string_h /* Make sure all the stdint.h macros are included - must come first! */ #ifndef __STDC_LIMIT_MACROS # define __STDC_LIMIT_MACROS #endif #ifndef __STDC_CONSTANT_MACROS # define __STDC_CONSTANT_MACROS #endif #if defined (VBOX_WITH_XPCOM) # include #endif #include "VBox/com/defs.h" #include "VBox/com/assert.h" #include #include #include namespace com { class Utf8Str; /** * Helper class that represents the |BSTR| type and hides platform-specific * implementation details. * * This class uses COM/XPCOM-provided memory management routines to allocate * and free string buffers. This makes it possible to: * - use it as a type of member variables of COM/XPCOM components and pass * their values to callers through component methods' output parameters * using the #cloneTo() operation; * - adopt (take ownership of) string buffers returned in output parameters * of COM methods using the #asOutParam() operation and correctly free them * afterwards. */ class Bstr { public: typedef BSTR String; typedef CBSTR ConstString; Bstr () : bstr (NULL) {} Bstr (const Bstr &that) : bstr (NULL) { raw_copy (bstr, that.bstr); } Bstr (CBSTR that) : bstr (NULL) { raw_copy (bstr, that); } #if defined (VBOX_WITH_XPCOM) Bstr (const wchar_t *that) : bstr (NULL) { AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR)); raw_copy (bstr, (CBSTR) that); } #endif Bstr (const Utf8Str &that); Bstr (const char *that); /** Shortcut that calls #alloc(aSize) right after object creation. */ Bstr (size_t aSize) : bstr (NULL) { alloc (aSize); } ~Bstr () { setNull(); } Bstr &operator = (const Bstr &that) { safe_assign (that.bstr); return *this; } Bstr &operator = (CBSTR that) { safe_assign (that); return *this; } Bstr &operator = (const Utf8Str &that); Bstr &operator = (const char *that); Bstr &setNull() { if (bstr) { ::SysFreeString (bstr); bstr = NULL; } return *this; } Bstr &setNullIfEmpty() { if (bstr && *bstr == 0) { ::SysFreeString (bstr); bstr = NULL; } return *this; } /** * Allocates memory for a string capable to store \a aSize - 1 characters; * in other words, aSize includes the terminating zero character. If \a aSize * is zero, or if a memory allocation error occurs, this object will become null. */ Bstr &alloc (size_t aSize) { setNull(); if (aSize) { unsigned int size = (unsigned int) aSize; Assert (size == aSize); bstr = ::SysAllocStringLen (NULL, size - 1); if (bstr) bstr [0] = 0; } return *this; } int compare (CBSTR str) const { return ::RTUtf16Cmp ((PRTUTF16) bstr, (PRTUTF16) str); } int compare (BSTR str) const { return ::RTUtf16Cmp ((PRTUTF16) bstr, (PRTUTF16) str); } bool operator == (const Bstr &that) const { return !compare (that.bstr); } bool operator != (const Bstr &that) const { return !!compare (that.bstr); } bool operator == (CBSTR that) const { return !compare (that); } bool operator == (BSTR that) const { return !compare (that); } #if defined (VBOX_WITH_XPCOM) bool operator != (const wchar_t *that) const { AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR)); return !!compare ((CBSTR) that); } bool operator == (const wchar_t *that) const { AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR)); return !compare ((CBSTR) that); } #endif bool operator != (CBSTR that) const { return !!compare (that); } bool operator != (BSTR that) const { return !!compare (that); } bool operator < (const Bstr &that) const { return compare (that.bstr) < 0; } bool operator < (CBSTR that) const { return compare (that) < 0; } bool operator < (BSTR that) const { return compare (that) < 0; } #if defined (VBOX_WITH_XPCOM) bool operator < (const wchar_t *that) const { AssertCompile (sizeof (wchar_t) == sizeof (OLECHAR)); return compare ((CBSTR) that) < 0; } #endif int compareIgnoreCase (CBSTR str) const { return ::RTUtf16LocaleICmp (bstr, str); } bool isNull() const { return bstr == NULL; } operator bool() const { return !isNull(); } bool isEmpty() const { return isNull() || *bstr == 0; } size_t length() const { return isNull() ? 0 : ::RTUtf16Len ((PRTUTF16) bstr); } /** Intended to to pass instances as |CBSTR| input parameters to methods. */ operator CBSTR () const { return bstr; } /** * Intended to to pass instances as |BSTR| input parameters to methods. * Note that we have to provide this mutable BSTR operator since in MS COM * input BSTR parameters of interface methods are not const. */ operator BSTR () { return bstr; } /** * The same as operator CBSTR(), but for situations where the compiler * cannot typecast implicitly (for example, in printf() argument list). */ CBSTR raw() const { return bstr; } /** * Returns a non-const raw pointer that allows to modify the string directly. * @warning * Be sure not to modify data beyond the allocated memory! The * guaranteed size of the allocated memory is at least #length() * bytes after creation and after every assignment operation. */ BSTR mutableRaw() { return bstr; } /** * Intended to assign copies of instances to |BSTR| out parameters from * within the interface method. Transfers the ownership of the duplicated * string to the caller. */ const Bstr &cloneTo (BSTR *pstr) const { if (pstr) { *pstr = NULL; raw_copy (*pstr, bstr); } return *this; } /** * Intended to assign instances to |BSTR| out parameters from within the * interface method. Transfers the ownership of the original string to the * caller and resets the instance to null. * * As opposed to cloneTo(), this method doesn't create a copy of the * string. */ Bstr &detachTo (BSTR *pstr) { *pstr = bstr; bstr = NULL; return *this; } /** * Intended to assign copies of instances to |char *| out parameters from * within the interface method. Transfers the ownership of the duplicated * string to the caller. */ const Bstr &cloneTo (char **pstr) const; /** * Intended to pass instances as |BSTR| out parameters to methods. * Takes the ownership of the returned data. */ BSTR *asOutParam() { setNull(); return &bstr; } /** * Static immutable null object. May be used for comparison purposes. */ static const Bstr Null; protected: void safe_assign (CBSTR str) { if (bstr != str) { setNull(); raw_copy (bstr, str); } } inline static void raw_copy (BSTR &ls, CBSTR rs) { if (rs) ls = ::SysAllocString ((const OLECHAR *) rs); } inline static void raw_copy (BSTR &ls, const char *rs) { if (rs) { PRTUTF16 s = NULL; ::RTStrToUtf16 (rs, &s); raw_copy (ls, (BSTR) s); ::RTUtf16Free (s); } } BSTR bstr; friend class Utf8Str; /* to access our raw_copy() */ }; /* symmetric compare operators */ inline bool operator== (CBSTR l, const Bstr &r) { return r.operator== (l); } inline bool operator!= (CBSTR l, const Bstr &r) { return r.operator!= (l); } inline bool operator== (BSTR l, const Bstr &r) { return r.operator== (l); } inline bool operator!= (BSTR l, const Bstr &r) { return r.operator!= (l); } //////////////////////////////////////////////////////////////////////////////// /** * Helper class that represents UTF8 (|char *|) strings. Useful in * conjunction with Bstr to simplify conversions between UTF16 (|BSTR|) * and UTF8. * * This class uses COM/XPCOM-provided memory management routines to allocate * and free string buffers. This makes it possible to: * - use it as a type of member variables of COM/XPCOM components and pass * their values to callers through component methods' output parameters * using the #cloneTo() operation; * - adopt (take ownership of) string buffers returned in output parameters * of COM methods using the #asOutParam() operation and correctly free them * afterwards. */ class Utf8Str { public: enum CaseSensitivity { CaseSensitive, CaseInsensitive }; typedef char *String; typedef const char *ConstString; Utf8Str () : str (NULL) {} Utf8Str (const Utf8Str &that) : str (NULL) { raw_copy (str, that.str); } Utf8Str (const char *that) : str (NULL) { raw_copy (str, that); } Utf8Str (const Bstr &that) : str (NULL) { raw_copy (str, that); } Utf8Str (CBSTR that) : str (NULL) { raw_copy (str, that); } /** Shortcut that calls #alloc(aSize) right after object creation. */ Utf8Str (size_t aSize) : str (NULL) { alloc(aSize); } virtual ~Utf8Str () { setNull(); } Utf8Str &operator = (const Utf8Str &that) { safe_assign (that.str); return *this; } Utf8Str &operator = (const char *that) { safe_assign (that); return *this; } Utf8Str &operator = (const Bstr &that) { setNull(); raw_copy (str, that); return *this; } Utf8Str &operator = (CBSTR that) { setNull(); raw_copy (str, that); return *this; } Utf8Str &setNull() { if (str) { #if !defined (VBOX_WITH_XPCOM) ::RTStrFree (str); #else nsMemory::Free (str); #endif str = NULL; } return *this; } Utf8Str &setNullIfEmpty() { if (str && *str == 0) { #if !defined (VBOX_WITH_XPCOM) ::RTStrFree (str); #else nsMemory::Free (str); #endif str = NULL; } return *this; } /** * Allocates memory for a string capable to store \a aSize - 1 bytes (not characters!); * in other words, aSize includes the terminating zero character. If \a aSize * is zero, or if a memory allocation error occurs, this object will become null. */ Utf8Str &alloc (size_t aSize) { setNull(); if (aSize) { #if !defined (VBOX_WITH_XPCOM) str = (char *) ::RTMemTmpAlloc (aSize); #else str = (char *) nsMemory::Alloc (aSize); #endif if (str) str [0] = 0; } return *this; } void append(const Utf8Str &that) { size_t cbThis = length(); size_t cbThat = that.length(); if (cbThat) { size_t cbBoth = cbThis + cbThat + 1; // @todo optimize with realloc() once the memory management is fixed char *pszTemp; #if !defined (VBOX_WITH_XPCOM) pszTemp = (char*)::RTMemTmpAlloc(cbBoth); #else pszTemp = (char*)nsMemory::Alloc(cbBoth); #endif if (str) { memcpy(pszTemp, str, cbThis); setNull(); } if (that.str) memcpy(pszTemp + cbThis, that.str, cbThat); pszTemp[cbThis + cbThat] = '\0'; str = pszTemp; } } int compare (const char *pcsz, CaseSensitivity cs = CaseSensitive) const { if (str == pcsz) return 0; if (str == NULL) return -1; if (pcsz == NULL) return 1; if (cs == CaseSensitive) return ::RTStrCmp(str, pcsz); else return ::RTStrICmp(str, pcsz); } int compare (const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const { return compare (that.str, cs); } bool operator == (const Utf8Str &that) const { return !compare (that); } bool operator != (const Utf8Str &that) const { return !!compare (that); } bool operator == (const char *that) const { return !compare (that); } bool operator != (const char *that) const { return !!compare (that); } bool operator < (const Utf8Str &that) const { return compare (that) < 0; } bool operator < (const char *that) const { return compare (that) < 0; } bool endsWith (const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const { if (isNull() || that.isNull()) return false; size_t l1 = length(); size_t l2 = that.length(); if (l1 < l2) return false; size_t l = l1 - l2; if (cs == CaseSensitive) return ::RTStrCmp(&str[l], that.str) == 0; else return ::RTStrICmp(&str[l], that.str) == 0; } bool startsWith (const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const { if (isNull() || that.isNull()) return false; size_t l1 = length(); size_t l2 = that.length(); if (l1 < l2) return false; if (cs == CaseSensitive) return ::RTStrNCmp(str, that.str, l2) == 0; else return ::RTStrNICmp(str, that.str, l2) == 0; } bool contains (const Utf8Str &that, CaseSensitivity cs = CaseSensitive) const { if (cs == CaseSensitive) return ::RTStrStr (str, that.str) != NULL; else return ::RTStrIStr (str, that.str) != NULL; } Utf8Str& toLower() { if (isEmpty()) return *this; ::RTStrToLower(str); return *this; } Utf8Str& toUpper() { if (isEmpty()) return *this; ::RTStrToUpper(str); return *this; } bool isNull() const { return str == NULL; } operator bool() const { return !isNull(); } bool isEmpty() const { return isNull() || *str == 0; } size_t length() const { return isNull() ? 0 : ::strlen (str); } /** Intended to to pass instances as input (|char *|) parameters to methods. */ operator const char *() const { return str; } /** The same as operator const char *(), but for situations where the compiler cannot typecast implicitly (for example, in printf() argument list). */ const char *raw() const { return str; } /** The same as operator const char *(), but for situations where the compiler cannot typecast implicitly (for example, in printf() argument list). */ const char *c_str() const { return str; } /** * Returns a non-const raw pointer that allows to modify the string directly. * @warning * Be sure not to modify data beyond the allocated memory! The * guaranteed size of the allocated memory is at least #length() * bytes after creation and after every assignment operation. */ char *mutableRaw() { return str; } /** * Intended to assign instances to |char *| out parameters from within the * interface method. Transfers the ownership of the duplicated string to the * caller. */ const Utf8Str &cloneTo (char **pstr) const { if (pstr) { *pstr = NULL; raw_copy (*pstr, str); } return *this; } /** * Intended to assign instances to |char *| out parameters from within the * interface method. Transfers the ownership of the original string to the * caller and resets the instance to null. * * As opposed to cloneTo(), this method doesn't create a copy of the * string. */ Utf8Str &detachTo (char **pstr) { *pstr = str; str = NULL; return *this; } /** * Intended to assign instances to |BSTR| out parameters from within the * interface method. Transfers the ownership of the duplicated string to the * caller. */ const Utf8Str &cloneTo (BSTR *pstr) const { if (pstr) { *pstr = NULL; Bstr::raw_copy (*pstr, str); } return *this; } static const size_t npos; /** * Looks for pcszFind in "this" starting at "pos" and returns its position, * counting from the beginning of "this" at 0. Returns npos if not found. */ size_t find(const char *pcszFind, size_t pos = 0) const; /** * Returns a substring of "this" as a new Utf8Str. Works exactly like * its equivalent in std::string except that this interprets pos and n * as UTF-8 codepoints instead of bytes. With the default parameters "0" * and "npos", this always copies the entire string. * @param pos Index of first codepoint to copy from "this", counting from 0. * @param n Number of codepoints to copy, starting with the one at "pos". */ Utf8Str substr(size_t pos = 0, size_t n = npos) const; /** * Attempts to convert the member string into an 32-bit integer. * * @returns 32-bit unsigned number on success. * @returns 0 on failure. */ int toInt32() const { return RTStrToInt32(str); } /** * Attempts to convert the member string into an unsigned 32-bit integer. * * @returns 32-bit unsigned number on success. * @returns 0 on failure. */ int toUInt32() const { return RTStrToUInt32(str); } /** * Attempts to convert the member string into an 64-bit integer. * * @returns 64-bit unsigned number on success. * @returns 0 on failure. */ int64_t toInt64() const { return RTStrToInt64(str); } /** * Attempts to convert the member string into an unsigned 64-bit integer. * * @returns 64-bit unsigned number on success. * @returns 0 on failure. */ uint64_t toUInt64() const { return RTStrToUInt64(str); } /** * Attempts to convert the member string into an unsigned 64-bit integer. * @return IPRT error code. * @param i Output buffer. */ int toInt(uint64_t &i) const; /** * Attempts to convert the member string into an unsigned 32-bit integer. * @return IPRT error code. * @param i Output buffer. */ int toInt(uint32_t &i) const; /** * Intended to pass instances as out (|char **|) parameters to methods. * Takes the ownership of the returned data. */ char **asOutParam() { setNull(); return &str; } /** * Static immutable null object. May be used for comparison purposes. */ static const Utf8Str Null; protected: void safe_assign (const char *s) { if (str != s) { setNull(); raw_copy (str, s); } } inline static void raw_copy (char *&ls, const char *rs) { if (rs) #if !defined (VBOX_WITH_XPCOM) ::RTStrDupEx (&ls, rs); #else ls = (char *) nsMemory::Clone (rs, strlen (rs) + 1); #endif } inline static void raw_copy (char *&ls, CBSTR rs) { if (rs) { #if !defined (VBOX_WITH_XPCOM) ::RTUtf16ToUtf8 ((PRTUTF16) rs, &ls); #else char *s = NULL; ::RTUtf16ToUtf8 ((PRTUTF16) rs, &s); raw_copy (ls, s); ::RTStrFree (s); #endif } } char *str; friend class Bstr; /* to access our raw_copy() */ }; // symmetric compare operators inline bool operator== (const char *l, const Utf8Str &r) { return r.operator== (l); } inline bool operator!= (const char *l, const Utf8Str &r) { return r.operator!= (l); } // work around error C2593 of the stupid MSVC 7.x ambiguity resolver WORKAROUND_MSVC7_ERROR_C2593_FOR_BOOL_OP (Bstr) WORKAROUND_MSVC7_ERROR_C2593_FOR_BOOL_OP (Utf8Str) //////////////////////////////////////////////////////////////////////////////// // inlined Bstr members that depend on Utf8Str inline Bstr::Bstr (const Utf8Str &that) : bstr (NULL) { raw_copy (bstr, that); } inline Bstr::Bstr (const char *that) : bstr (NULL) { raw_copy (bstr, that); } inline Bstr &Bstr::operator = (const Utf8Str &that) { setNull(); raw_copy (bstr, that); return *this; } inline Bstr &Bstr::operator = (const char *that) { setNull(); raw_copy (bstr, that); return *this; } inline const Bstr &Bstr::cloneTo (char **pstr) const { if (pstr) { *pstr = NULL; Utf8Str::raw_copy (*pstr, bstr); } return *this; } //////////////////////////////////////////////////////////////////////////////// /** * This class is a printf-like formatter for Utf8Str strings. Its purpose is * to construct Utf8Str objects from a format string and a list of arguments * for the format string. * * The usage of this class is like the following: * * Utf8StrFmt string ("program name = %s", argv[0]); * */ class Utf8StrFmt : public Utf8Str { public: /** * Constructs a new string given the format string and the list * of the arguments for the format string. * * @param format printf-like format string (in UTF-8 encoding) * @param ... list of the arguments for the format string */ explicit Utf8StrFmt (const char *format, ...) { va_list args; va_start (args, format); init (format, args); va_end (args); } protected: Utf8StrFmt() {} void init (const char *format, va_list args); private: static DECLCALLBACK(size_t) strOutput (void *pvArg, const char *pachChars, size_t cbChars); }; /** * This class is a vprintf-like formatter for Utf8Str strings. It is * identical to Utf8StrFmt except that its constructor takes a va_list * argument instead of ellipsis. * * Note that a separate class is necessary because va_list is defined as * |char *| on most platforms. For this reason, if we had two overloaded * constructors in Utf8StrFmt (one taking ellipsis and another one taking * va_list) then composing a constructor call using exactly two |char *| * arguments would cause the compiler to use the va_list overload instead of * the ellipsis one which is obviously wrong. The compiler would choose * va_list because ellipsis has the lowest rank when it comes to resolving * overloads, as opposed to va_list which is an exact match for |char *|. */ class Utf8StrFmtVA : public Utf8StrFmt { public: /** * Constructs a new string given the format string and the list * of the arguments for the format string. * * @param format printf-like format string (in UTF-8 encoding) * @param args list of arguments for the format string */ Utf8StrFmtVA (const char *format, va_list args) { init (format, args); } }; /** * The BstrFmt class is a shortcut to Bstr (Utf8StrFmt (...)). */ class BstrFmt : public Bstr { public: /** * Constructs a new string given the format string and the list of the * arguments for the format string. * * @param aFormat printf-like format string (in UTF-8 encoding). * @param ... List of the arguments for the format string. */ explicit BstrFmt (const char *aFormat, ...) { va_list args; va_start (args, aFormat); raw_copy (bstr, Utf8StrFmtVA (aFormat, args)); va_end (args); } }; /** * The BstrFmtVA class is a shortcut to Bstr (Utf8StrFmtVA (...)). */ class BstrFmtVA : public Bstr { public: /** * Constructs a new string given the format string and the list of the * arguments for the format string. * * @param aFormat printf-like format string (in UTF-8 encoding). * @param aArgs List of arguments for the format string */ BstrFmtVA (const char *aFormat, va_list aArgs) { raw_copy (bstr, Utf8StrFmtVA (aFormat, aArgs)); } }; } /* namespace com */ #endif /* ___VBox_com_string_h */