VirtualBox

source: vbox/trunk/include/VBox/com/string.h@ 36882

Last change on this file since 36882 was 36527, checked in by vboxsync, 14 years ago

iprt::MiniString -> RTCString.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 19.2 KB
Line 
1/* $Id: string.h 36527 2011-04-04 13:16:09Z vboxsync $ */
2/** @file
3 * MS COM / XPCOM Abstraction Layer - Smart string classes declaration.
4 */
5
6/*
7 * Copyright (C) 2006-2011 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27#ifndef ___VBox_com_string_h
28#define ___VBox_com_string_h
29
30/* Make sure all the stdint.h macros are included - must come first! */
31#ifndef __STDC_LIMIT_MACROS
32# define __STDC_LIMIT_MACROS
33#endif
34#ifndef __STDC_CONSTANT_MACROS
35# define __STDC_CONSTANT_MACROS
36#endif
37
38#if defined(VBOX_WITH_XPCOM)
39# include <nsMemory.h>
40#endif
41
42#include "VBox/com/defs.h"
43#include "VBox/com/assert.h"
44
45#include <iprt/mem.h>
46#include <iprt/cpp/ministring.h>
47
48namespace com
49{
50
51class Utf8Str;
52
53// global constant in glue/string.cpp that represents an empty BSTR
54extern const BSTR g_bstrEmpty;
55
56/**
57 * String class used universally in Main for COM-style Utf-16 strings.
58 *
59 * Unfortunately COM on Windows uses UTF-16 everywhere, requiring conversions
60 * back and forth since most of VirtualBox and our libraries use UTF-8.
61 *
62 * To make things more obscure, on Windows, a COM-style BSTR is not just a
63 * pointer to a null-terminated wide character array, but the four bytes (32
64 * bits) BEFORE the memory that the pointer points to are a length DWORD. One
65 * must therefore avoid pointer arithmetic and always use SysAllocString and
66 * the like to deal with BSTR pointers, which manage that DWORD correctly.
67 *
68 * For platforms other than Windows, we provide our own versions of the Sys*
69 * functions in Main/xpcom/helpers.cpp which do NOT use length prefixes though
70 * to be compatible with how XPCOM allocates string parameters to public
71 * functions.
72 *
73 * The Bstr class hides all this handling behind a std::string-like interface
74 * and also provides automatic conversions to RTCString and Utf8Str instances.
75 *
76 * The one advantage of using the SysString* routines is that this makes it
77 * possible to use it as a type of member variables of COM/XPCOM components and
78 * pass their values to callers through component methods' output parameters
79 * using the #cloneTo() operation. Also, the class can adopt (take ownership
80 * of) string buffers returned in output parameters of COM methods using the
81 * #asOutParam() operation and correctly free them afterwards.
82 *
83 * Starting with VirtualBox 3.2, like Utf8Str, Bstr no longer differentiates
84 * between NULL strings and empty strings. In other words, Bstr("") and
85 * Bstr(NULL) behave the same. In both cases, Bstr allocates no memory,
86 * reports a zero length and zero allocated bytes for both, and returns an
87 * empty C wide string from raw().
88 *
89 * @note All Bstr methods ASSUMES valid UTF-16 or UTF-8 input strings.
90 * The VirtualBox policy in this regard is to validate strings coming
91 * from external sources before passing them to Bstr or Utf8Str.
92 */
93class Bstr
94{
95public:
96
97 Bstr()
98 : m_bstr(NULL)
99 { }
100
101 Bstr(const Bstr &that)
102 {
103 copyFrom((const OLECHAR *)that.m_bstr);
104 }
105
106 Bstr(CBSTR that)
107 {
108 copyFrom((const OLECHAR *)that);
109 }
110
111#if defined(VBOX_WITH_XPCOM)
112 Bstr(const wchar_t *that)
113 {
114 AssertCompile(sizeof(wchar_t) == sizeof(OLECHAR));
115 copyFrom((const OLECHAR *)that);
116 }
117#endif
118
119 Bstr(const RTCString &that)
120 {
121 copyFrom(that.c_str());
122 }
123
124 Bstr(const char *that)
125 {
126 copyFrom(that);
127 }
128
129 Bstr(const char *a_pThat, size_t a_cchMax)
130 {
131 copyFromN(a_pThat, a_cchMax);
132 }
133
134 ~Bstr()
135 {
136 setNull();
137 }
138
139 Bstr& operator=(const Bstr &that)
140 {
141 cleanup();
142 copyFrom((const OLECHAR *)that.m_bstr);
143 return *this;
144 }
145
146 Bstr& operator=(CBSTR that)
147 {
148 cleanup();
149 copyFrom((const OLECHAR *)that);
150 return *this;
151 }
152
153#if defined(VBOX_WITH_XPCOM)
154 Bstr& operator=(const wchar_t *that)
155 {
156 cleanup();
157 copyFrom((const OLECHAR *)that);
158 return *this;
159 }
160#endif
161
162 Bstr& setNull()
163 {
164 cleanup();
165 return *this;
166 }
167
168 RTMEMEF_NEW_AND_DELETE_OPERATORS();
169
170 /** Case sensitivity selector. */
171 enum CaseSensitivity
172 {
173 CaseSensitive,
174 CaseInsensitive
175 };
176
177 /**
178 * Compares the member string to str.
179 * @param str
180 * @param cs Whether comparison should be case-sensitive.
181 * @return
182 */
183 int compare(CBSTR str, CaseSensitivity cs = CaseSensitive) const
184 {
185 if (cs == CaseSensitive)
186 return ::RTUtf16Cmp((PRTUTF16)m_bstr, (PRTUTF16)str);
187 return ::RTUtf16LocaleICmp((PRTUTF16)m_bstr, (PRTUTF16)str);
188 }
189
190 int compare(BSTR str, CaseSensitivity cs = CaseSensitive) const
191 {
192 return compare((CBSTR)str, cs);
193 }
194
195 int compare(const Bstr &that, CaseSensitivity cs = CaseSensitive) const
196 {
197 return compare(that.m_bstr, cs);
198 }
199
200 bool operator==(const Bstr &that) const { return !compare(that.m_bstr); }
201 bool operator!=(const Bstr &that) const { return !!compare(that.m_bstr); }
202 bool operator==(CBSTR that) const { return !compare(that); }
203 bool operator==(BSTR that) const { return !compare(that); }
204
205 bool operator!=(CBSTR that) const { return !!compare(that); }
206 bool operator!=(BSTR that) const { return !!compare(that); }
207 bool operator<(const Bstr &that) const { return compare(that.m_bstr) < 0; }
208 bool operator<(CBSTR that) const { return compare(that) < 0; }
209 bool operator<(BSTR that) const { return compare(that) < 0; }
210
211 /**
212 * Returns true if the member string has no length.
213 * This is true for instances created from both NULL and "" input strings.
214 *
215 * @note Always use this method to check if an instance is empty. Do not
216 * use length() because that may need to run through the entire string
217 * (Bstr does not cache string lengths).
218 */
219 bool isEmpty() const { return m_bstr == NULL || *m_bstr == 0; }
220
221 /**
222 * Returns true if the member string has a length of one or more.
223 *
224 * @returns true if not empty, false if empty (NULL or "").
225 */
226 bool isNotEmpty() const { return m_bstr != NULL && *m_bstr != 0; }
227
228 size_t length() const { return isEmpty() ? 0 : ::RTUtf16Len((PRTUTF16)m_bstr); }
229
230#if defined(VBOX_WITH_XPCOM)
231 /**
232 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
233 * returns a pointer to a global variable containing an empty BSTR with a proper zero
234 * length prefix so that Windows is happy.
235 */
236 CBSTR raw() const
237 {
238 if (m_bstr)
239 return m_bstr;
240
241 return g_bstrEmpty;
242 }
243#else
244 /**
245 * Windows-only hack, as the automatically generated headers use BSTR.
246 * So if we don't want to cast like crazy we have to be more loose than
247 * on XPCOM.
248 *
249 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
250 * returns a pointer to a global variable containing an empty BSTR with a proper zero
251 * length prefix so that Windows is happy.
252 */
253 BSTR raw() const
254 {
255 if (m_bstr)
256 return m_bstr;
257
258 return g_bstrEmpty;
259 }
260#endif
261
262 /**
263 * Returns a non-const raw pointer that allows to modify the string directly.
264 * As opposed to raw(), this DOES return NULL if the member string is empty
265 * because we cannot return a mutable pointer to the global variable with the
266 * empty string.
267 *
268 * @warning
269 * Be sure not to modify data beyond the allocated memory! The
270 * guaranteed size of the allocated memory is at least #length()
271 * bytes after creation and after every assignment operation.
272 */
273 BSTR mutableRaw() { return m_bstr; }
274
275 /**
276 * Intended to assign copies of instances to |BSTR| out parameters from
277 * within the interface method. Transfers the ownership of the duplicated
278 * string to the caller.
279 *
280 * If the member string is empty, this allocates an empty BSTR in *pstr
281 * (i.e. makes it point to a new buffer with a null byte).
282 */
283 void cloneTo(BSTR *pstr) const
284 {
285 if (pstr)
286 {
287 *pstr = ::SysAllocString((const OLECHAR *)raw()); // raw() returns a pointer to "" if empty
288#ifdef RT_EXCEPTIONS_ENABLED
289 if (!*pstr)
290 throw std::bad_alloc();
291#endif
292 }
293 }
294
295 /**
296 * Intended to assign instances to |BSTR| out parameters from within the
297 * interface method. Transfers the ownership of the original string to the
298 * caller and resets the instance to null.
299 *
300 * As opposed to cloneTo(), this method doesn't create a copy of the
301 * string.
302 *
303 * If the member string is empty, this allocates an empty BSTR in *pstr
304 * (i.e. makes it point to a new buffer with a null byte).
305 *
306 * @param pbstrDst The BSTR variable to detach the string to.
307 *
308 * @throws std::bad_alloc if we failed to allocate a new empty string.
309 */
310 void detachTo(BSTR *pbstrDst)
311 {
312 if (m_bstr)
313 *pbstrDst = m_bstr;
314 else
315 {
316 // allocate null BSTR
317 *pbstrDst = ::SysAllocString((const OLECHAR *)g_bstrEmpty);
318#ifdef RT_EXCEPTIONS_ENABLED
319 if (!*pbstrDst)
320 throw std::bad_alloc();
321#endif
322 }
323 m_bstr = NULL;
324 }
325
326 /**
327 * Intended to pass instances as |BSTR| out parameters to methods.
328 * Takes the ownership of the returned data.
329 */
330 BSTR *asOutParam()
331 {
332 cleanup();
333 return &m_bstr;
334 }
335
336 /**
337 * Static immutable empty-string object. May be used for comparison purposes.
338 */
339 static const Bstr Empty;
340
341protected:
342
343 void cleanup()
344 {
345 if (m_bstr)
346 {
347 ::SysFreeString(m_bstr);
348 m_bstr = NULL;
349 }
350 }
351
352 /**
353 * Protected internal helper to copy a string. This ignores the previous object
354 * state, so either call this from a constructor or call cleanup() first.
355 *
356 * This variant copies from a zero-terminated UTF-16 string (which need not
357 * be a BSTR, i.e. need not have a length prefix).
358 *
359 * If the source is empty, this sets the member string to NULL.
360 *
361 * @param a_bstrSrc The source string. The caller guarantees
362 * that this is valid UTF-16.
363 *
364 * @throws std::bad_alloc - the object is representing an empty string.
365 */
366 void copyFrom(const OLECHAR *a_bstrSrc)
367 {
368 if (a_bstrSrc && *a_bstrSrc)
369 {
370 m_bstr = ::SysAllocString(a_bstrSrc);
371#ifdef RT_EXCEPTIONS_ENABLED
372 if (!m_bstr)
373 throw std::bad_alloc();
374#endif
375 }
376 else
377 m_bstr = NULL;
378 }
379
380 /**
381 * Protected internal helper to copy a string. This ignores the previous object
382 * state, so either call this from a constructor or call cleanup() first.
383 *
384 * This variant copies and converts from a zero-terminated UTF-8 string.
385 *
386 * If the source is empty, this sets the member string to NULL.
387 *
388 * @param a_pszSrc The source string. The caller guarantees
389 * that this is valid UTF-8.
390 *
391 * @throws std::bad_alloc - the object is representing an empty string.
392 */
393 void copyFrom(const char *a_pszSrc)
394 {
395 copyFromN(a_pszSrc, RTSTR_MAX);
396 }
397
398 /**
399 * Variant of copyFrom for sub-string constructors.
400 *
401 * @param a_pszSrc The source string. The caller guarantees
402 * that this is valid UTF-8.
403 * @param a_cchMax The maximum number of chars (not
404 * codepoints) to copy. If you pass RTSTR_MAX
405 * it'll be exactly like copyFrom().
406 *
407 * @throws std::bad_alloc - the object is representing an empty string.
408 */
409 void copyFromN(const char *a_pszSrc, size_t a_cchSrc);
410
411 BSTR m_bstr;
412
413 friend class Utf8Str; /* to access our raw_copy() */
414};
415
416/* symmetric compare operators */
417inline bool operator==(CBSTR l, const Bstr &r) { return r.operator==(l); }
418inline bool operator!=(CBSTR l, const Bstr &r) { return r.operator!=(l); }
419inline bool operator==(BSTR l, const Bstr &r) { return r.operator==(l); }
420inline bool operator!=(BSTR l, const Bstr &r) { return r.operator!=(l); }
421
422
423
424
425/**
426 * String class used universally in Main for UTF-8 strings.
427 *
428 * This is based on RTCString, to which some functionality has been
429 * moved. Here we keep things that are specific to Main, such as conversions
430 * with UTF-16 strings (Bstr).
431 *
432 * Like RTCString, Utf8Str does not differentiate between NULL strings
433 * and empty strings. In other words, Utf8Str("") and Utf8Str(NULL) behave the
434 * same. In both cases, RTCString allocates no memory, reports
435 * a zero length and zero allocated bytes for both, and returns an empty
436 * C string from c_str().
437 *
438 * @note All Utf8Str methods ASSUMES valid UTF-8 or UTF-16 input strings.
439 * The VirtualBox policy in this regard is to validate strings coming
440 * from external sources before passing them to Utf8Str or Bstr.
441 */
442class Utf8Str : public RTCString
443{
444public:
445
446 Utf8Str() {}
447
448 Utf8Str(const RTCString &that)
449 : RTCString(that)
450 {}
451
452 Utf8Str(const char *that)
453 : RTCString(that)
454 {}
455
456 Utf8Str(const Bstr &that)
457 {
458 copyFrom(that.raw());
459 }
460
461 Utf8Str(CBSTR that)
462 {
463 copyFrom(that);
464 }
465
466 /**
467 * Constructs a new string given the format string and the list of the
468 * arguments for the format string.
469 *
470 * @param a_pszFormat Pointer to the format string (UTF-8),
471 * @see pg_rt_str_format.
472 * @param a_va Argument vector containing the arguments
473 * specified by the format string.
474 * @sa RTCString::printfV
475 */
476 Utf8Str(const char *a_pszFormat, va_list a_va)
477 : RTCString(a_pszFormat, a_va)
478 {
479 }
480
481 Utf8Str& operator=(const RTCString &that)
482 {
483 RTCString::operator=(that);
484 return *this;
485 }
486
487 Utf8Str& operator=(const char *that)
488 {
489 RTCString::operator=(that);
490 return *this;
491 }
492
493 Utf8Str& operator=(const Bstr &that)
494 {
495 cleanup();
496 copyFrom(that.raw());
497 return *this;
498 }
499
500 Utf8Str& operator=(CBSTR that)
501 {
502 cleanup();
503 copyFrom(that);
504 return *this;
505 }
506
507 RTMEMEF_NEW_AND_DELETE_OPERATORS();
508
509#if defined(VBOX_WITH_XPCOM)
510 /**
511 * Intended to assign instances to |char *| out parameters from within the
512 * interface method. Transfers the ownership of the duplicated string to the
513 * caller.
514 *
515 * This allocates a single 0 byte in the target if the member string is empty.
516 *
517 * This uses XPCOM memory allocation and thus only works on XPCOM. MSCOM doesn't
518 * like char* strings anyway.
519 */
520 void cloneTo(char **pstr) const;
521#endif
522
523 /**
524 * Intended to assign instances to |BSTR| out parameters from within the
525 * interface method. Transfers the ownership of the duplicated string to the
526 * caller.
527 */
528 void cloneTo(BSTR *pstr) const
529 {
530 if (pstr)
531 {
532 Bstr bstr(*this);
533 bstr.cloneTo(pstr);
534 }
535 }
536
537 /**
538 * Removes a trailing slash from the member string, if present.
539 * Calls RTPathStripTrailingSlash() without having to mess with mutableRaw().
540 */
541 Utf8Str& stripTrailingSlash();
542
543 /**
544 * Removes a trailing filename from the member string, if present.
545 * Calls RTPathStripFilename() without having to mess with mutableRaw().
546 */
547 Utf8Str& stripFilename();
548
549 /**
550 * Removes the path component from the member string, if present.
551 * Calls RTPathFilename() without having to mess with mutableRaw().
552 */
553 Utf8Str& stripPath();
554
555 /**
556 * Removes a trailing file name extension from the member string, if present.
557 * Calls RTPathStripExt() without having to mess with mutableRaw().
558 */
559 Utf8Str& stripExt();
560
561 /**
562 * Static immutable empty-string object. May be used for comparison purposes.
563 */
564 static const Utf8Str Empty;
565
566protected:
567
568 void copyFrom(CBSTR a_pbstr);
569
570 friend class Bstr; /* to access our raw_copy() */
571};
572
573/**
574 * Class with RTCString::printf as constructor for your convenience.
575 *
576 * Constructing a Utf8Str string object from a format string and a variable
577 * number of arguments can easily be confused with the other Utf8Str
578 * constructures, thus this child class.
579 *
580 * The usage of this class is like the following:
581 * @code
582 Utf8StrFmt strName("program name = %s", argv[0]);
583 @endcode
584 */
585class Utf8StrFmt : public Utf8Str
586{
587public:
588
589 /**
590 * Constructs a new string given the format string and the list of the
591 * arguments for the format string.
592 *
593 * @param a_pszFormat Pointer to the format string (UTF-8),
594 * @see pg_rt_str_format.
595 * @param ... Ellipsis containing the arguments specified by
596 * the format string.
597 */
598 explicit Utf8StrFmt(const char *a_pszFormat, ...)
599 {
600 va_list va;
601 va_start(va, a_pszFormat);
602 printfV(a_pszFormat, va);
603 va_end(va);
604 }
605
606 RTMEMEF_NEW_AND_DELETE_OPERATORS();
607
608protected:
609 Utf8StrFmt()
610 { }
611
612private:
613};
614
615/**
616 * The BstrFmt class is a shortcut to <tt>Bstr(Utf8StrFmt(...))</tt>.
617 */
618class BstrFmt : public Bstr
619{
620public:
621
622 /**
623 * Constructs a new string given the format string and the list of the
624 * arguments for the format string.
625 *
626 * @param aFormat printf-like format string (in UTF-8 encoding).
627 * @param ... List of the arguments for the format string.
628 */
629 explicit BstrFmt(const char *aFormat, ...)
630 {
631 va_list args;
632 va_start(args, aFormat);
633 copyFrom(Utf8Str(aFormat, args).c_str());
634 va_end(args);
635 }
636
637 RTMEMEF_NEW_AND_DELETE_OPERATORS();
638};
639
640/**
641 * The BstrFmtVA class is a shortcut to <tt>Bstr(Utf8Str(format,va))</tt>.
642 */
643class BstrFmtVA : public Bstr
644{
645public:
646
647 /**
648 * Constructs a new string given the format string and the list of the
649 * arguments for the format string.
650 *
651 * @param aFormat printf-like format string (in UTF-8 encoding).
652 * @param aArgs List of arguments for the format string
653 */
654 BstrFmtVA(const char *aFormat, va_list aArgs)
655 {
656 copyFrom(Utf8Str(aFormat, aArgs).c_str());
657 }
658
659 RTMEMEF_NEW_AND_DELETE_OPERATORS();
660};
661
662} /* namespace com */
663
664#endif /* !___VBox_com_string_h */
665
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette