VirtualBox

source: vbox/trunk/include/VBox/com/string.h@ 80838

Last change on this file since 80838 was 80838, checked in by vboxsync, 6 years ago

Main/glue: Added an erase method identical to the one in RTCString.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 44.7 KB
Line 
1/* $Id: string.h 80838 2019-09-17 00:48:36Z vboxsync $ */
2/** @file
3 * MS COM / XPCOM Abstraction Layer - Smart string classes declaration.
4 */
5
6/*
7 * Copyright (C) 2006-2019 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27#ifndef VBOX_INCLUDED_com_string_h
28#define VBOX_INCLUDED_com_string_h
29#ifndef RT_WITHOUT_PRAGMA_ONCE
30# pragma once
31#endif
32
33/* Make sure all the stdint.h macros are included - must come first! */
34#ifndef __STDC_LIMIT_MACROS
35# define __STDC_LIMIT_MACROS
36#endif
37#ifndef __STDC_CONSTANT_MACROS
38# define __STDC_CONSTANT_MACROS
39#endif
40
41#if defined(VBOX_WITH_XPCOM)
42# include <nsMemory.h>
43#endif
44
45#include "VBox/com/defs.h"
46#include "VBox/com/assert.h"
47
48#include <iprt/mem.h>
49#include <iprt/utf16.h>
50#include <iprt/cpp/ministring.h>
51
52
53/** @defgroup grp_com_str Smart String Classes
54 * @ingroup grp_com
55 * @{
56 */
57
58namespace com
59{
60
61class Utf8Str;
62
63// global constant in glue/string.cpp that represents an empty BSTR
64extern const BSTR g_bstrEmpty;
65
66/**
67 * String class used universally in Main for COM-style Utf-16 strings.
68 *
69 * Unfortunately COM on Windows uses UTF-16 everywhere, requiring conversions
70 * back and forth since most of VirtualBox and our libraries use UTF-8.
71 *
72 * To make things more obscure, on Windows, a COM-style BSTR is not just a
73 * pointer to a null-terminated wide character array, but the four bytes (32
74 * bits) BEFORE the memory that the pointer points to are a length DWORD. One
75 * must therefore avoid pointer arithmetic and always use SysAllocString and
76 * the like to deal with BSTR pointers, which manage that DWORD correctly.
77 *
78 * For platforms other than Windows, we provide our own versions of the Sys*
79 * functions in Main/xpcom/helpers.cpp which do NOT use length prefixes though
80 * to be compatible with how XPCOM allocates string parameters to public
81 * functions.
82 *
83 * The Bstr class hides all this handling behind a std::string-like interface
84 * and also provides automatic conversions to RTCString and Utf8Str instances.
85 *
86 * The one advantage of using the SysString* routines is that this makes it
87 * possible to use it as a type of member variables of COM/XPCOM components and
88 * pass their values to callers through component methods' output parameters
89 * using the #cloneTo() operation. Also, the class can adopt (take ownership
90 * of) string buffers returned in output parameters of COM methods using the
91 * #asOutParam() operation and correctly free them afterwards.
92 *
93 * Starting with VirtualBox 3.2, like Utf8Str, Bstr no longer differentiates
94 * between NULL strings and empty strings. In other words, Bstr("") and
95 * Bstr(NULL) behave the same. In both cases, Bstr allocates no memory,
96 * reports a zero length and zero allocated bytes for both, and returns an
97 * empty C wide string from raw().
98 *
99 * @note All Bstr methods ASSUMES valid UTF-16 or UTF-8 input strings.
100 * The VirtualBox policy in this regard is to validate strings coming
101 * from external sources before passing them to Bstr or Utf8Str.
102 */
103class Bstr
104{
105public:
106
107 Bstr()
108 : m_bstr(NULL)
109 { }
110
111 Bstr(const Bstr &that)
112 {
113 copyFrom((const OLECHAR *)that.m_bstr);
114 }
115
116 Bstr(CBSTR that)
117 {
118 copyFrom((const OLECHAR *)that);
119 }
120
121#if defined(VBOX_WITH_XPCOM)
122 Bstr(const wchar_t *that)
123 {
124 AssertCompile(sizeof(wchar_t) == sizeof(OLECHAR));
125 copyFrom((const OLECHAR *)that);
126 }
127#endif
128
129 Bstr(const RTCString &that)
130 {
131 copyFrom(that.c_str());
132 }
133
134 Bstr(const char *that)
135 {
136 copyFrom(that);
137 }
138
139 Bstr(const char *a_pThat, size_t a_cchMax)
140 {
141 copyFromN(a_pThat, a_cchMax);
142 }
143
144 ~Bstr()
145 {
146 setNull();
147 }
148
149 Bstr &operator=(const Bstr &that)
150 {
151 cleanup();
152 copyFrom((const OLECHAR *)that.m_bstr);
153 return *this;
154 }
155
156 Bstr &operator=(CBSTR that)
157 {
158 cleanup();
159 copyFrom((const OLECHAR *)that);
160 return *this;
161 }
162
163#if defined(VBOX_WITH_XPCOM)
164 Bstr &operator=(const wchar_t *that)
165 {
166 cleanup();
167 copyFrom((const OLECHAR *)that);
168 return *this;
169 }
170#endif
171
172 Bstr &setNull()
173 {
174 cleanup();
175 return *this;
176 }
177
178#ifdef _MSC_VER
179# if _MSC_VER >= 1400
180 RTMEMEF_NEW_AND_DELETE_OPERATORS();
181# endif
182#else
183 RTMEMEF_NEW_AND_DELETE_OPERATORS();
184#endif
185
186 /** Case sensitivity selector. */
187 enum CaseSensitivity
188 {
189 CaseSensitive,
190 CaseInsensitive
191 };
192
193 /**
194 * Compares the member string to str.
195 * @param str
196 * @param cs Whether comparison should be case-sensitive.
197 * @return
198 */
199 int compare(CBSTR str, CaseSensitivity cs = CaseSensitive) const
200 {
201 if (cs == CaseSensitive)
202 return ::RTUtf16Cmp((PRTUTF16)m_bstr, (PRTUTF16)str);
203 return ::RTUtf16LocaleICmp((PRTUTF16)m_bstr, (PRTUTF16)str);
204 }
205
206 int compare(BSTR str, CaseSensitivity cs = CaseSensitive) const
207 {
208 return compare((CBSTR)str, cs);
209 }
210
211 int compare(const Bstr &that, CaseSensitivity cs = CaseSensitive) const
212 {
213 return compare(that.m_bstr, cs);
214 }
215
216 bool operator==(const Bstr &that) const { return !compare(that.m_bstr); }
217 bool operator==(CBSTR that) const { return !compare(that); }
218 bool operator==(BSTR that) const { return !compare(that); }
219 bool operator!=(const Bstr &that) const { return !!compare(that.m_bstr); }
220 bool operator!=(CBSTR that) const { return !!compare(that); }
221 bool operator!=(BSTR that) const { return !!compare(that); }
222 bool operator<(const Bstr &that) const { return compare(that.m_bstr) < 0; }
223 bool operator<(CBSTR that) const { return compare(that) < 0; }
224 bool operator<(BSTR that) const { return compare(that) < 0; }
225 bool operator<=(const Bstr &that) const { return compare(that.m_bstr) <= 0; }
226 bool operator<=(CBSTR that) const { return compare(that) <= 0; }
227 bool operator<=(BSTR that) const { return compare(that) <= 0; }
228 bool operator>(const Bstr &that) const { return compare(that.m_bstr) > 0; }
229 bool operator>(CBSTR that) const { return compare(that) > 0; }
230 bool operator>(BSTR that) const { return compare(that) > 0; }
231 bool operator>=(const Bstr &that) const { return compare(that.m_bstr) >= 0; }
232 bool operator>=(CBSTR that) const { return compare(that) >= 0; }
233 bool operator>=(BSTR that) const { return compare(that) >= 0; }
234
235 /**
236 * Compares this string to an UTF-8 C style string.
237 *
238 * @retval 0 if equal
239 * @retval -1 if this string is smaller than the UTF-8 one.
240 * @retval 1 if the UTF-8 string is smaller than this.
241 *
242 * @param a_pszRight The string to compare with.
243 * @param a_enmCase Whether comparison should be case-sensitive.
244 */
245 int compareUtf8(const char *a_pszRight, CaseSensitivity a_enmCase = CaseSensitive) const;
246
247 /** Java style compare method.
248 * @returns true if @a a_pszRight equals this string.
249 * @param a_pszRight The (UTF-8) string to compare with. */
250 bool equals(const char *a_pszRight) const { return compareUtf8(a_pszRight, CaseSensitive) == 0; }
251
252 /** Java style case-insensitive compare method.
253 * @returns true if @a a_pszRight equals this string.
254 * @param a_pszRight The (UTF-8) string to compare with. */
255 bool equalsIgnoreCase(const char *a_pszRight) const { return compareUtf8(a_pszRight, CaseInsensitive) == 0; }
256
257 /** Java style compare method.
258 * @returns true if @a a_rThat equals this string.
259 * @param a_rThat The other Bstr instance to compare with. */
260 bool equals(const Bstr &a_rThat) const { return compare(a_rThat.m_bstr, CaseSensitive) == 0; }
261 /** Java style case-insensitive compare method.
262 * @returns true if @a a_rThat equals this string.
263 * @param a_rThat The other Bstr instance to compare with. */
264 bool equalsIgnoreCase(const Bstr &a_rThat) const { return compare(a_rThat.m_bstr, CaseInsensitive) == 0; }
265
266 /** Java style compare method.
267 * @returns true if @a a_pThat equals this string.
268 * @param a_pThat The native const BSTR to compare with. */
269 bool equals(CBSTR a_pThat) const { return compare(a_pThat, CaseSensitive) == 0; }
270 /** Java style case-insensitive compare method.
271 * @returns true if @a a_pThat equals this string.
272 * @param a_pThat The native const BSTR to compare with. */
273 bool equalsIgnoreCase(CBSTR a_pThat) const { return compare(a_pThat, CaseInsensitive) == 0; }
274
275 /** Java style compare method.
276 * @returns true if @a a_pThat equals this string.
277 * @param a_pThat The native BSTR to compare with. */
278 bool equals(BSTR a_pThat) const { return compare(a_pThat, CaseSensitive) == 0; }
279 /** Java style case-insensitive compare method.
280 * @returns true if @a a_pThat equals this string.
281 * @param a_pThat The native BSTR to compare with. */
282 bool equalsIgnoreCase(BSTR a_pThat) const { return compare(a_pThat, CaseInsensitive) == 0; }
283
284 /**
285 * Returns true if the member string has no length.
286 * This is true for instances created from both NULL and "" input strings.
287 *
288 * @note Always use this method to check if an instance is empty. Do not
289 * use length() because that may need to run through the entire string
290 * (Bstr does not cache string lengths).
291 */
292 bool isEmpty() const { return m_bstr == NULL || *m_bstr == 0; }
293
294 /**
295 * Returns true if the member string has a length of one or more.
296 *
297 * @returns true if not empty, false if empty (NULL or "").
298 */
299 bool isNotEmpty() const { return m_bstr != NULL && *m_bstr != 0; }
300
301 size_t length() const { return isEmpty() ? 0 : ::RTUtf16Len((PRTUTF16)m_bstr); }
302
303 /**
304 * Assigns the output of the string format operation (RTStrPrintf).
305 *
306 * @param pszFormat Pointer to the format string,
307 * @see pg_rt_str_format.
308 * @param ... Ellipsis containing the arguments specified by
309 * the format string.
310 *
311 * @throws std::bad_alloc On allocation error. Object state is undefined.
312 *
313 * @returns Reference to the object.
314 */
315 Bstr &printf(const char *pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2);
316
317 /**
318 * Assigns the output of the string format operation (RTStrPrintf).
319 *
320 * @param pszFormat Pointer to the format string,
321 * @see pg_rt_str_format.
322 * @param ... Ellipsis containing the arguments specified by
323 * the format string.
324 *
325 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
326 */
327 HRESULT printfNoThrow(const char *pszFormat, ...) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 2);
328
329 /**
330 * Assigns the output of the string format operation (RTStrPrintfV).
331 *
332 * @param pszFormat Pointer to the format string,
333 * @see pg_rt_str_format.
334 * @param va Argument vector containing the arguments
335 * specified by the format string.
336 *
337 * @throws std::bad_alloc On allocation error. Object state is undefined.
338 *
339 * @returns Reference to the object.
340 */
341 Bstr &printfV(const char *pszFormat, va_list va) RT_IPRT_FORMAT_ATTR(1, 0);
342
343 /**
344 * Assigns the output of the string format operation (RTStrPrintfV).
345 *
346 * @param pszFormat Pointer to the format string,
347 * @see pg_rt_str_format.
348 * @param va Argument vector containing the arguments
349 * specified by the format string.
350 *
351 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
352 */
353 HRESULT printfVNoThrow(const char *pszFormat, va_list va) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 0);
354
355 /** @name Append methods and operators
356 * @{ */
357
358 /**
359 * Appends the string @a that to @a rThat.
360 *
361 * @param rThat The string to append.
362 * @throws std::bad_alloc On allocation error. The object is left unchanged.
363 * @returns Reference to the object.
364 */
365 Bstr &append(const Bstr &rThat);
366
367 /**
368 * Appends the string @a that to @a rThat.
369 *
370 * @param rThat The string to append.
371 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
372 */
373 HRESULT appendNoThrow(const Bstr &rThat) RT_NOEXCEPT;
374
375 /**
376 * Appends the UTF-8 string @a that to @a rThat.
377 *
378 * @param rThat The string to append.
379 * @throws std::bad_alloc On allocation error. The object is left unchanged.
380 * @returns Reference to the object.
381 */
382 Bstr &append(const RTCString &rThat);
383
384 /**
385 * Appends the UTF-8 string @a that to @a rThat.
386 *
387 * @param rThat The string to append.
388 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
389 */
390 HRESULT appendNoThrow(const RTCString &rThat) RT_NOEXCEPT;
391
392 /**
393 * Appends the UTF-16 string @a pszSrc to @a this.
394 *
395 * @param pwszSrc The C-style UTF-16 string to append.
396 * @throws std::bad_alloc On allocation error. The object is left unchanged.
397 * @returns Reference to the object.
398 */
399 Bstr &append(CBSTR pwszSrc);
400
401 /**
402 * Appends the UTF-16 string @a pszSrc to @a this.
403 *
404 * @param pwszSrc The C-style UTF-16 string to append.
405 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
406 */
407 HRESULT appendNoThrow(CBSTR pwszSrc) RT_NOEXCEPT;
408
409 /**
410 * Appends the UTF-8 string @a pszSrc to @a this.
411 *
412 * @param pszSrc The C-style string to append.
413 * @throws std::bad_alloc On allocation error. The object is left unchanged.
414 * @returns Reference to the object.
415 */
416 Bstr &append(const char *pszSrc);
417
418 /**
419 * Appends the UTF-8 string @a pszSrc to @a this.
420 *
421 * @param pszSrc The C-style string to append.
422 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
423 */
424 HRESULT appendNoThrow(const char *pszSrc) RT_NOEXCEPT;
425
426 /**
427 * Appends the a substring from @a rThat to @a this.
428 *
429 * @param rThat The string to append a substring from.
430 * @param offStart The start of the substring to append (UTF-16
431 * offset, not codepoint).
432 * @param cwcMax The maximum number of UTF-16 units to append.
433 * @throws std::bad_alloc On allocation error. The object is left unchanged.
434 * @returns Reference to the object.
435 */
436 Bstr &append(const Bstr &rThat, size_t offStart, size_t cwcMax = RTSTR_MAX);
437
438 /**
439 * Appends the a substring from @a rThat to @a this.
440 *
441 * @param rThat The string to append a substring from.
442 * @param offStart The start of the substring to append (UTF-16
443 * offset, not codepoint).
444 * @param cwcMax The maximum number of UTF-16 units to append.
445 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
446 */
447 HRESULT appendNoThrow(const Bstr &rThat, size_t offStart, size_t cwcMax = RTSTR_MAX) RT_NOEXCEPT;
448
449 /**
450 * Appends the a substring from UTF-8 @a rThat to @a this.
451 *
452 * @param rThat The string to append a substring from.
453 * @param offStart The start of the substring to append (byte offset,
454 * not codepoint).
455 * @param cchMax The maximum number of bytes to append.
456 * @throws std::bad_alloc On allocation error. The object is left unchanged.
457 * @returns Reference to the object.
458 */
459 Bstr &append(const RTCString &rThat, size_t offStart, size_t cchMax = RTSTR_MAX);
460
461 /**
462 * Appends the a substring from UTF-8 @a rThat to @a this.
463 *
464 * @param rThat The string to append a substring from.
465 * @param offStart The start of the substring to append (byte offset,
466 * not codepoint).
467 * @param cchMax The maximum number of bytes to append.
468 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
469 */
470 HRESULT appendNoThrow(const RTCString &rThat, size_t offStart, size_t cchMax = RTSTR_MAX) RT_NOEXCEPT;
471
472 /**
473 * Appends the first @a cchMax chars from UTF-16 string @a pszThat to @a this.
474 *
475 * @param pwszThat The C-style UTF-16 string to append.
476 * @param cchMax The maximum number of bytes to append.
477 * @throws std::bad_alloc On allocation error. The object is left unchanged.
478 * @returns Reference to the object.
479 */
480 Bstr &append(CBSTR pwszThat, size_t cchMax);
481
482 /**
483 * Appends the first @a cchMax chars from UTF-16 string @a pszThat to @a this.
484 *
485 * @param pwszThat The C-style UTF-16 string to append.
486 * @param cchMax The maximum number of bytes to append.
487 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
488 */
489 HRESULT appendNoThrow(CBSTR pwszThat, size_t cchMax) RT_NOEXCEPT;
490
491 /**
492 * Appends the first @a cchMax chars from string @a pszThat to @a this.
493 *
494 * @param pszThat The C-style string to append.
495 * @param cchMax The maximum number of bytes to append.
496 * @throws std::bad_alloc On allocation error. The object is left unchanged.
497 * @returns Reference to the object.
498 */
499 Bstr &append(const char *pszThat, size_t cchMax);
500
501 /**
502 * Appends the first @a cchMax chars from string @a pszThat to @a this.
503 *
504 * @param pszThat The C-style string to append.
505 * @param cchMax The maximum number of bytes to append.
506 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
507 */
508 HRESULT appendNoThrow(const char *pszThat, size_t cchMax) RT_NOEXCEPT;
509
510 /**
511 * Appends the given character to @a this.
512 *
513 * @param ch The character to append.
514 * @throws std::bad_alloc On allocation error. The object is left unchanged.
515 * @returns Reference to the object.
516 */
517 Bstr &append(char ch);
518
519 /**
520 * Appends the given character to @a this.
521 *
522 * @param ch The character to append.
523 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
524 */
525 HRESULT appendNoThrow(char ch) RT_NOEXCEPT;
526
527 /**
528 * Appends the given unicode code point to @a this.
529 *
530 * @param uc The unicode code point to append.
531 * @throws std::bad_alloc On allocation error. The object is left unchanged.
532 * @returns Reference to the object.
533 */
534 Bstr &appendCodePoint(RTUNICP uc);
535
536 /**
537 * Appends the given unicode code point to @a this.
538 *
539 * @param uc The unicode code point to append.
540 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
541 */
542 HRESULT appendCodePointNoThrow(RTUNICP uc) RT_NOEXCEPT;
543
544 /**
545 * Appends the output of the string format operation (RTStrPrintf).
546 *
547 * @param pszFormat Pointer to the format string,
548 * @see pg_rt_str_format.
549 * @param ... Ellipsis containing the arguments specified by
550 * the format string.
551 *
552 * @throws std::bad_alloc On allocation error. Object state is undefined.
553 *
554 * @returns Reference to the object.
555 */
556 Bstr &appendPrintf(const char *pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2);
557
558 /**
559 * Appends the output of the string format operation (RTStrPrintf).
560 *
561 * @param pszFormat Pointer to the format string,
562 * @see pg_rt_str_format.
563 * @param ... Ellipsis containing the arguments specified by
564 * the format string.
565 *
566 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
567 */
568 HRESULT appendPrintfNoThrow(const char *pszFormat, ...) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 2);
569
570 /**
571 * Appends the output of the string format operation (RTStrPrintfV).
572 *
573 * @param pszFormat Pointer to the format string,
574 * @see pg_rt_str_format.
575 * @param va Argument vector containing the arguments
576 * specified by the format string.
577 *
578 * @throws std::bad_alloc On allocation error. Object state is undefined.
579 *
580 * @returns Reference to the object.
581 */
582 Bstr &appendPrintfV(const char *pszFormat, va_list va) RT_IPRT_FORMAT_ATTR(1, 0);
583
584 /**
585 * Appends the output of the string format operation (RTStrPrintfV).
586 *
587 * @param pszFormat Pointer to the format string,
588 * @see pg_rt_str_format.
589 * @param va Argument vector containing the arguments
590 * specified by the format string.
591 *
592 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
593 */
594 HRESULT appendPrintfVNoThrow(const char *pszFormat, va_list va) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 0);
595
596 /**
597 * Shortcut to append(), Bstr variant.
598 *
599 * @param rThat The string to append.
600 * @returns Reference to the object.
601 */
602 Bstr &operator+=(const Bstr &rThat)
603 {
604 return append(rThat);
605 }
606
607 /**
608 * Shortcut to append(), RTCString variant.
609 *
610 * @param rThat The string to append.
611 * @returns Reference to the object.
612 */
613 Bstr &operator+=(const RTCString &rThat)
614 {
615 return append(rThat);
616 }
617
618 /**
619 * Shortcut to append(), CBSTR variant.
620 *
621 * @param pwszThat The C-style string to append.
622 * @returns Reference to the object.
623 */
624 Bstr &operator+=(CBSTR pwszThat)
625 {
626 return append(pwszThat);
627 }
628
629 /**
630 * Shortcut to append(), const char * variant.
631 *
632 * @param pszThat The C-style string to append.
633 * @returns Reference to the object.
634 */
635 Bstr &operator+=(const char *pszThat)
636 {
637 return append(pszThat);
638 }
639
640 /**
641 * Shortcut to append(), char variant.
642 *
643 * @param ch The character to append.
644 *
645 * @returns Reference to the object.
646 */
647 Bstr &operator+=(char ch)
648 {
649 return append(ch);
650 }
651
652 /** @} */
653
654 /**
655 * Erases a sequence from the string.
656 *
657 * @returns Reference to the object.
658 * @param offStart Where in @a this string to start erasing (UTF-16
659 * units, not codepoints).
660 * @param cwcLength How much following @a offStart to erase (UTF-16
661 * units, not codepoints).
662 */
663 Bstr &erase(size_t offStart = 0, size_t cwcLength = RTSTR_MAX) RT_NOEXCEPT;
664
665
666#if defined(VBOX_WITH_XPCOM)
667 /**
668 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
669 * returns a pointer to a global variable containing an empty BSTR with a proper zero
670 * length prefix so that Windows is happy.
671 */
672 CBSTR raw() const
673 {
674 if (m_bstr)
675 return m_bstr;
676
677 return g_bstrEmpty;
678 }
679#else
680 /**
681 * Windows-only hack, as the automatically generated headers use BSTR.
682 * So if we don't want to cast like crazy we have to be more loose than
683 * on XPCOM.
684 *
685 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
686 * returns a pointer to a global variable containing an empty BSTR with a proper zero
687 * length prefix so that Windows is happy.
688 */
689 BSTR raw() const
690 {
691 if (m_bstr)
692 return m_bstr;
693
694 return g_bstrEmpty;
695 }
696#endif
697
698 /**
699 * Returns a non-const raw pointer that allows modifying the string directly.
700 *
701 * @note As opposed to raw(), this DOES return NULL if the member string is
702 * empty because we cannot return a mutable pointer to the global variable
703 * with the empty string.
704 *
705 * @note If modifying the string size (only shrinking it is allows), #jolt() or
706 * #joltNoThrow() must be called!
707 *
708 * @note Do not modify memory beyond the #length() of the string!
709 *
710 * @sa joltNoThrow(), mutalbleRaw(), reserve(), reserveNoThrow()
711 */
712 BSTR mutableRaw() { return m_bstr; }
713
714 /**
715 * Correct the embedded length after using mutableRaw().
716 *
717 * This is needed on COM (Windows) to update the embedded string length. It is
718 * a stub on hosts using XPCOM.
719 *
720 * @param cwcNew The new string length, if handy, otherwise a negative
721 * number.
722 * @sa joltNoThrow(), mutalbleRaw(), reserve(), reserveNoThrow()
723 */
724#ifndef VBOX_WITH_XPCOM
725 void jolt(ssize_t cwcNew = -1);
726#else
727 void jolt(ssize_t cwcNew = -1)
728 {
729 Assert(cwcNew < 0 || (cwcNew == 0 && !m_bstr) || m_bstr[cwcNew] == '\0'); RT_NOREF(cwcNew);
730 }
731#endif
732
733 /**
734 * Correct the embedded length after using mutableRaw().
735 *
736 * This is needed on COM (Windows) to update the embedded string length. It is
737 * a stub on hosts using XPCOM.
738 *
739 * @returns S_OK on success, E_OUTOFMEMORY if shrinking the string failed.
740 * @param cwcNew The new string length, if handy, otherwise a negative
741 * number.
742 * @sa jolt(), mutalbleRaw(), reserve(), reserveNoThrow()
743 */
744#ifndef VBOX_WITH_XPCOM
745 HRESULT joltNoThrow(ssize_t cwcNew = -1) RT_NOEXCEPT;
746#else
747 HRESULT joltNoThrow(ssize_t cwcNew = -1) RT_NOEXCEPT
748 {
749 Assert(cwcNew < 0 || (cwcNew == 0 && !m_bstr) || m_bstr[cwcNew] == '\0'); RT_NOREF(cwcNew);
750 return S_OK;
751 }
752#endif
753
754 /**
755 * Make sure at that least @a cwc of buffer space is reserved.
756 *
757 * Requests that the contained memory buffer have at least cb bytes allocated.
758 * This may expand or shrink the string's storage, but will never truncate the
759 * contained string. In other words, cb will be ignored if it's smaller than
760 * length() + 1.
761 *
762 * @param cwcMin The new minimum string length that the can be stored. This
763 * does not include the terminator.
764 * @param fForce Force this size.
765 *
766 * @throws std::bad_alloc On allocation error. The object is left unchanged.
767 */
768 void reserve(size_t cwcMin, bool fForce = false);
769
770 /**
771 * A C like version of the #reserve() method, i.e. return code instead of throw.
772 *
773 * @returns S_OK or E_OUTOFMEMORY.
774 * @param cwcMin The new minimum string length that the can be stored. This
775 * does not include the terminator.
776 * @param fForce Force this size.
777 */
778 HRESULT reserveNoThrow(size_t cwcMin, bool fForce = false) RT_NOEXCEPT;
779
780 /**
781 * Intended to assign copies of instances to |BSTR| out parameters from
782 * within the interface method. Transfers the ownership of the duplicated
783 * string to the caller.
784 *
785 * If the member string is empty, this allocates an empty BSTR in *pstr
786 * (i.e. makes it point to a new buffer with a null byte).
787 *
788 * @deprecated Use cloneToEx instead to avoid throwing exceptions.
789 */
790 void cloneTo(BSTR *pstr) const
791 {
792 if (pstr)
793 {
794 *pstr = ::SysAllocString((const OLECHAR *)raw()); // raw() returns a pointer to "" if empty
795#ifdef RT_EXCEPTIONS_ENABLED
796 if (!*pstr)
797 throw std::bad_alloc();
798#endif
799 }
800 }
801
802 /**
803 * A version of cloneTo that does not throw any out of memory exceptions, but
804 * returns E_OUTOFMEMORY intead.
805 * @returns S_OK or E_OUTOFMEMORY.
806 */
807 HRESULT cloneToEx(BSTR *pstr) const
808 {
809 if (!pstr)
810 return S_OK;
811 *pstr = ::SysAllocString((const OLECHAR *)raw()); // raw() returns a pointer to "" if empty
812 return pstr ? S_OK : E_OUTOFMEMORY;
813 }
814
815 /**
816 * Intended to assign instances to |BSTR| out parameters from within the
817 * interface method. Transfers the ownership of the original string to the
818 * caller and resets the instance to null.
819 *
820 * As opposed to cloneTo(), this method doesn't create a copy of the
821 * string.
822 *
823 * If the member string is empty, this allocates an empty BSTR in *pstr
824 * (i.e. makes it point to a new buffer with a null byte).
825 *
826 * @param pbstrDst The BSTR variable to detach the string to.
827 *
828 * @throws std::bad_alloc if we failed to allocate a new empty string.
829 */
830 void detachTo(BSTR *pbstrDst)
831 {
832 if (m_bstr)
833 {
834 *pbstrDst = m_bstr;
835 m_bstr = NULL;
836 }
837 else
838 {
839 // allocate null BSTR
840 *pbstrDst = ::SysAllocString((const OLECHAR *)g_bstrEmpty);
841#ifdef RT_EXCEPTIONS_ENABLED
842 if (!*pbstrDst)
843 throw std::bad_alloc();
844#endif
845 }
846 }
847
848 /**
849 * A version of detachTo that does not throw exceptions on out-of-memory
850 * conditions, but instead returns E_OUTOFMEMORY.
851 *
852 * @param pbstrDst The BSTR variable to detach the string to.
853 * @returns S_OK or E_OUTOFMEMORY.
854 */
855 HRESULT detachToEx(BSTR *pbstrDst)
856 {
857 if (m_bstr)
858 {
859 *pbstrDst = m_bstr;
860 m_bstr = NULL;
861 }
862 else
863 {
864 // allocate null BSTR
865 *pbstrDst = ::SysAllocString((const OLECHAR *)g_bstrEmpty);
866 if (!*pbstrDst)
867 return E_OUTOFMEMORY;
868 }
869 return S_OK;
870 }
871
872 /**
873 * Intended to pass instances as |BSTR| out parameters to methods.
874 * Takes the ownership of the returned data.
875 */
876 BSTR *asOutParam()
877 {
878 cleanup();
879 return &m_bstr;
880 }
881
882 /**
883 * Static immutable empty-string object. May be used for comparison purposes.
884 */
885 static const Bstr Empty;
886
887protected:
888
889 void cleanup()
890 {
891 if (m_bstr)
892 {
893 ::SysFreeString(m_bstr);
894 m_bstr = NULL;
895 }
896 }
897
898 /**
899 * Protected internal helper to copy a string. This ignores the previous object
900 * state, so either call this from a constructor or call cleanup() first.
901 *
902 * This variant copies from a zero-terminated UTF-16 string (which need not
903 * be a BSTR, i.e. need not have a length prefix).
904 *
905 * If the source is empty, this sets the member string to NULL.
906 *
907 * @param a_bstrSrc The source string. The caller guarantees
908 * that this is valid UTF-16.
909 *
910 * @throws std::bad_alloc - the object is representing an empty string.
911 */
912 void copyFrom(const OLECHAR *a_bstrSrc)
913 {
914 if (a_bstrSrc && *a_bstrSrc)
915 {
916 m_bstr = ::SysAllocString(a_bstrSrc);
917#ifdef RT_EXCEPTIONS_ENABLED
918 if (!m_bstr)
919 throw std::bad_alloc();
920#endif
921 }
922 else
923 m_bstr = NULL;
924 }
925
926 /**
927 * Protected internal helper to copy a string. This ignores the previous object
928 * state, so either call this from a constructor or call cleanup() first.
929 *
930 * This variant copies and converts from a zero-terminated UTF-8 string.
931 *
932 * If the source is empty, this sets the member string to NULL.
933 *
934 * @param a_pszSrc The source string. The caller guarantees
935 * that this is valid UTF-8.
936 *
937 * @throws std::bad_alloc - the object is representing an empty string.
938 */
939 void copyFrom(const char *a_pszSrc)
940 {
941 copyFromN(a_pszSrc, RTSTR_MAX);
942 }
943
944 /**
945 * Variant of copyFrom for sub-string constructors.
946 *
947 * @param a_pszSrc The source string. The caller guarantees
948 * that this is valid UTF-8.
949 * @param a_cchSrc The maximum number of chars (not codepoints) to
950 * copy. If you pass RTSTR_MAX it'll be exactly
951 * like copyFrom().
952 *
953 * @throws std::bad_alloc - the object is representing an empty string.
954 */
955 void copyFromN(const char *a_pszSrc, size_t a_cchSrc);
956
957 Bstr &appendWorkerUtf16(PCRTUTF16 pwszSrc, size_t cwcSrc);
958 Bstr &appendWorkerUtf8(const char *pszSrc, size_t cchSrc);
959 HRESULT appendWorkerUtf16NoThrow(PCRTUTF16 pwszSrc, size_t cwcSrc) RT_NOEXCEPT;
960 HRESULT appendWorkerUtf8NoThrow(const char *pszSrc, size_t cchSrc) RT_NOEXCEPT;
961
962 static DECLCALLBACK(size_t) printfOutputCallbackNoThrow(void *pvArg, const char *pachChars, size_t cbChars) RT_NOEXCEPT;
963
964 BSTR m_bstr;
965
966 friend class Utf8Str; /* to access our raw_copy() */
967};
968
969/* symmetric compare operators */
970inline bool operator==(CBSTR l, const Bstr &r) { return r.operator==(l); }
971inline bool operator!=(CBSTR l, const Bstr &r) { return r.operator!=(l); }
972inline bool operator==(BSTR l, const Bstr &r) { return r.operator==(l); }
973inline bool operator!=(BSTR l, const Bstr &r) { return r.operator!=(l); }
974
975
976
977
978/**
979 * String class used universally in Main for UTF-8 strings.
980 *
981 * This is based on RTCString, to which some functionality has been
982 * moved. Here we keep things that are specific to Main, such as conversions
983 * with UTF-16 strings (Bstr).
984 *
985 * Like RTCString, Utf8Str does not differentiate between NULL strings
986 * and empty strings. In other words, Utf8Str("") and Utf8Str(NULL) behave the
987 * same. In both cases, RTCString allocates no memory, reports
988 * a zero length and zero allocated bytes for both, and returns an empty
989 * C string from c_str().
990 *
991 * @note All Utf8Str methods ASSUMES valid UTF-8 or UTF-16 input strings.
992 * The VirtualBox policy in this regard is to validate strings coming
993 * from external sources before passing them to Utf8Str or Bstr.
994 */
995class Utf8Str : public RTCString
996{
997public:
998
999 Utf8Str() {}
1000
1001 Utf8Str(const RTCString &that)
1002 : RTCString(that)
1003 {}
1004
1005 Utf8Str(const char *that)
1006 : RTCString(that)
1007 {}
1008
1009 Utf8Str(const Bstr &that)
1010 {
1011 copyFrom(that.raw());
1012 }
1013
1014 Utf8Str(CBSTR that, size_t a_cwcSize = RTSTR_MAX)
1015 {
1016 copyFrom(that, a_cwcSize);
1017 }
1018
1019 Utf8Str(const char *a_pszSrc, size_t a_cchSrc)
1020 : RTCString(a_pszSrc, a_cchSrc)
1021 {
1022 }
1023
1024 /**
1025 * Constructs a new string given the format string and the list of the
1026 * arguments for the format string.
1027 *
1028 * @param a_pszFormat Pointer to the format string (UTF-8),
1029 * @see pg_rt_str_format.
1030 * @param a_va Argument vector containing the arguments
1031 * specified by the format string.
1032 * @sa RTCString::printfV
1033 */
1034 Utf8Str(const char *a_pszFormat, va_list a_va) RT_IPRT_FORMAT_ATTR(1, 0)
1035 : RTCString(a_pszFormat, a_va)
1036 {
1037 }
1038
1039 Utf8Str& operator=(const RTCString &that)
1040 {
1041 RTCString::operator=(that);
1042 return *this;
1043 }
1044
1045 Utf8Str& operator=(const char *that)
1046 {
1047 RTCString::operator=(that);
1048 return *this;
1049 }
1050
1051 Utf8Str& operator=(const Bstr &that)
1052 {
1053 cleanup();
1054 copyFrom(that.raw());
1055 return *this;
1056 }
1057
1058 Utf8Str& operator=(CBSTR that)
1059 {
1060 cleanup();
1061 copyFrom(that);
1062 return *this;
1063 }
1064
1065 /**
1066 * Extended assignment method that returns a COM status code instead of an
1067 * exception on failure.
1068 *
1069 * @returns S_OK or E_OUTOFMEMORY.
1070 * @param a_rSrcStr The source string
1071 */
1072 HRESULT assignEx(Utf8Str const &a_rSrcStr)
1073 {
1074 return copyFromExNComRC(a_rSrcStr.m_psz, 0, a_rSrcStr.m_cch);
1075 }
1076
1077 /**
1078 * Extended assignment method that returns a COM status code instead of an
1079 * exception on failure.
1080 *
1081 * @returns S_OK, E_OUTOFMEMORY or E_INVALIDARG.
1082 * @param a_rSrcStr The source string
1083 * @param a_offSrc The character (byte) offset of the substring.
1084 * @param a_cchSrc The number of characters (bytes) to copy from the source
1085 * string.
1086 */
1087 HRESULT assignEx(Utf8Str const &a_rSrcStr, size_t a_offSrc, size_t a_cchSrc)
1088 {
1089 if ( a_offSrc + a_cchSrc > a_rSrcStr.m_cch
1090 || a_offSrc > a_rSrcStr.m_cch)
1091 return E_INVALIDARG;
1092 return copyFromExNComRC(a_rSrcStr.m_psz, a_offSrc, a_cchSrc);
1093 }
1094
1095 /**
1096 * Extended assignment method that returns a COM status code instead of an
1097 * exception on failure.
1098 *
1099 * @returns S_OK or E_OUTOFMEMORY.
1100 * @param a_pcszSrc The source string
1101 */
1102 HRESULT assignEx(const char *a_pcszSrc)
1103 {
1104 return copyFromExNComRC(a_pcszSrc, 0, a_pcszSrc ? strlen(a_pcszSrc) : 0);
1105 }
1106
1107 /**
1108 * Extended assignment method that returns a COM status code instead of an
1109 * exception on failure.
1110 *
1111 * @returns S_OK or E_OUTOFMEMORY.
1112 * @param a_pcszSrc The source string
1113 * @param a_cchSrc The number of characters (bytes) to copy from the source
1114 * string.
1115 */
1116 HRESULT assignEx(const char *a_pcszSrc, size_t a_cchSrc)
1117 {
1118 return copyFromExNComRC(a_pcszSrc, 0, a_cchSrc);
1119 }
1120
1121 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1122
1123#if defined(VBOX_WITH_XPCOM)
1124 /**
1125 * Intended to assign instances to |char *| out parameters from within the
1126 * interface method. Transfers the ownership of the duplicated string to the
1127 * caller.
1128 *
1129 * This allocates a single 0 byte in the target if the member string is empty.
1130 *
1131 * This uses XPCOM memory allocation and thus only works on XPCOM. MSCOM doesn't
1132 * like char* strings anyway.
1133 */
1134 void cloneTo(char **pstr) const;
1135
1136 /**
1137 * A version of cloneTo that does not throw allocation errors but returns
1138 * E_OUTOFMEMORY instead.
1139 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1140 */
1141 HRESULT cloneToEx(char **pstr) const;
1142#endif
1143
1144 /**
1145 * Intended to assign instances to |BSTR| out parameters from within the
1146 * interface method. Transfers the ownership of the duplicated string to the
1147 * caller.
1148 */
1149 void cloneTo(BSTR *pstr) const
1150 {
1151 if (pstr)
1152 {
1153 Bstr bstr(*this);
1154 bstr.cloneTo(pstr);
1155 }
1156 }
1157
1158 /**
1159 * A version of cloneTo that does not throw allocation errors but returns
1160 * E_OUTOFMEMORY instead.
1161 *
1162 * @param pbstr Where to store a clone of the string.
1163 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1164 */
1165 HRESULT cloneToEx(BSTR *pbstr) const
1166 {
1167 if (!pbstr)
1168 return S_OK;
1169 Bstr bstr(*this);
1170 return bstr.detachToEx(pbstr);
1171 }
1172
1173 /**
1174 * Safe assignment from BSTR.
1175 *
1176 * @param pbstrSrc The source string.
1177 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1178 */
1179 HRESULT cloneEx(CBSTR pbstrSrc)
1180 {
1181 cleanup();
1182 return copyFromEx(pbstrSrc);
1183 }
1184
1185 /**
1186 * Removes a trailing slash from the member string, if present.
1187 * Calls RTPathStripTrailingSlash() without having to mess with mutableRaw().
1188 */
1189 Utf8Str& stripTrailingSlash();
1190
1191 /**
1192 * Removes a trailing filename from the member string, if present.
1193 * Calls RTPathStripFilename() without having to mess with mutableRaw().
1194 */
1195 Utf8Str& stripFilename();
1196
1197 /**
1198 * Removes the path component from the member string, if present.
1199 * Calls RTPathFilename() without having to mess with mutableRaw().
1200 */
1201 Utf8Str& stripPath();
1202
1203 /**
1204 * Removes a trailing file name suffix from the member string, if present.
1205 * Calls RTPathStripSuffix() without having to mess with mutableRaw().
1206 */
1207 Utf8Str& stripSuffix();
1208
1209 /**
1210 * Parses key=value pairs.
1211 *
1212 * @returns offset of the @a a_rPairSeparator following the returned value.
1213 * @retval npos is returned if there are no more key/value pairs.
1214 *
1215 * @param a_rKey Reference to variable that should receive
1216 * the key substring. This is set to null if
1217 * no key/value found. (It's also possible the
1218 * key is an empty string, so be careful.)
1219 * @param a_rValue Reference to variable that should receive
1220 * the value substring. This is set to null if
1221 * no key/value found. (It's also possible the
1222 * value is an empty string, so be careful.)
1223 * @param a_offStart The offset to start searching from. This is
1224 * typically 0 for the first call, and the
1225 * return value of the previous call for the
1226 * subsequent ones.
1227 * @param a_rPairSeparator The pair separator string. If this is an
1228 * empty string, the whole string will be
1229 * considered as a single key/value pair.
1230 * @param a_rKeyValueSeparator The key/value separator string.
1231 */
1232 size_t parseKeyValue(Utf8Str &a_rKey, Utf8Str &a_rValue, size_t a_offStart = 0,
1233 const Utf8Str &a_rPairSeparator = ",", const Utf8Str &a_rKeyValueSeparator = "=") const;
1234
1235 /**
1236 * Static immutable empty-string object. May be used for comparison purposes.
1237 */
1238 static const Utf8Str Empty;
1239protected:
1240
1241 void copyFrom(CBSTR a_pbstr, size_t a_cwcMax = RTSTR_MAX);
1242 HRESULT copyFromEx(CBSTR a_pbstr);
1243 HRESULT copyFromExNComRC(const char *a_pcszSrc, size_t a_offSrc, size_t a_cchSrc);
1244
1245 friend class Bstr; /* to access our raw_copy() */
1246};
1247
1248/**
1249 * Class with RTCString::printf as constructor for your convenience.
1250 *
1251 * Constructing a Utf8Str string object from a format string and a variable
1252 * number of arguments can easily be confused with the other Utf8Str
1253 * constructures, thus this child class.
1254 *
1255 * The usage of this class is like the following:
1256 * @code
1257 Utf8StrFmt strName("program name = %s", argv[0]);
1258 @endcode
1259 */
1260class Utf8StrFmt : public Utf8Str
1261{
1262public:
1263
1264 /**
1265 * Constructs a new string given the format string and the list of the
1266 * arguments for the format string.
1267 *
1268 * @param a_pszFormat Pointer to the format string (UTF-8),
1269 * @see pg_rt_str_format.
1270 * @param ... Ellipsis containing the arguments specified by
1271 * the format string.
1272 */
1273 explicit Utf8StrFmt(const char *a_pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2)
1274 {
1275 va_list va;
1276 va_start(va, a_pszFormat);
1277 printfV(a_pszFormat, va);
1278 va_end(va);
1279 }
1280
1281 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1282
1283protected:
1284 Utf8StrFmt()
1285 { }
1286
1287private:
1288};
1289
1290/**
1291 * The BstrFmt class is a shortcut to <tt>Bstr(Utf8StrFmt(...))</tt>.
1292 */
1293class BstrFmt : public Bstr
1294{
1295public:
1296
1297 /**
1298 * Constructs a new string given the format string and the list of the
1299 * arguments for the format string.
1300 *
1301 * @param aFormat printf-like format string (in UTF-8 encoding).
1302 * @param ... List of the arguments for the format string.
1303 */
1304 explicit BstrFmt(const char *aFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2)
1305 {
1306 va_list args;
1307 va_start(args, aFormat);
1308 copyFrom(Utf8Str(aFormat, args).c_str());
1309 va_end(args);
1310 }
1311
1312 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1313};
1314
1315/**
1316 * The BstrFmtVA class is a shortcut to <tt>Bstr(Utf8Str(format,va))</tt>.
1317 */
1318class BstrFmtVA : public Bstr
1319{
1320public:
1321
1322 /**
1323 * Constructs a new string given the format string and the list of the
1324 * arguments for the format string.
1325 *
1326 * @param aFormat printf-like format string (in UTF-8 encoding).
1327 * @param aArgs List of arguments for the format string
1328 */
1329 BstrFmtVA(const char *aFormat, va_list aArgs) RT_IPRT_FORMAT_ATTR(1, 0)
1330 {
1331 copyFrom(Utf8Str(aFormat, aArgs).c_str());
1332 }
1333
1334 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1335};
1336
1337} /* namespace com */
1338
1339/** @} */
1340
1341#endif /* !VBOX_INCLUDED_com_string_h */
1342
Note: See TracBrowser for help on using the repository browser.

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette