VirtualBox

source: vbox/trunk/include/VBox/com/string.h@ 80836

Last change on this file since 80836 was 80836, checked in by vboxsync, 6 years ago

Main/glue: Added all the append methods that RTCString have and then some.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 44.2 KB
Line 
1/* $Id: string.h 80836 2019-09-17 00:26:52Z vboxsync $ */
2/** @file
3 * MS COM / XPCOM Abstraction Layer - Smart string classes declaration.
4 */
5
6/*
7 * Copyright (C) 2006-2019 Oracle Corporation
8 *
9 * This file is part of VirtualBox Open Source Edition (OSE), as
10 * available from http://www.virtualbox.org. This file is free software;
11 * you can redistribute it and/or modify it under the terms of the GNU
12 * General Public License (GPL) as published by the Free Software
13 * Foundation, in version 2 as it comes in the "COPYING" file of the
14 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
15 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
16 *
17 * The contents of this file may alternatively be used under the terms
18 * of the Common Development and Distribution License Version 1.0
19 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
20 * VirtualBox OSE distribution, in which case the provisions of the
21 * CDDL are applicable instead of those of the GPL.
22 *
23 * You may elect to license modified versions of this file under the
24 * terms and conditions of either the GPL or the CDDL or both.
25 */
26
27#ifndef VBOX_INCLUDED_com_string_h
28#define VBOX_INCLUDED_com_string_h
29#ifndef RT_WITHOUT_PRAGMA_ONCE
30# pragma once
31#endif
32
33/* Make sure all the stdint.h macros are included - must come first! */
34#ifndef __STDC_LIMIT_MACROS
35# define __STDC_LIMIT_MACROS
36#endif
37#ifndef __STDC_CONSTANT_MACROS
38# define __STDC_CONSTANT_MACROS
39#endif
40
41#if defined(VBOX_WITH_XPCOM)
42# include <nsMemory.h>
43#endif
44
45#include "VBox/com/defs.h"
46#include "VBox/com/assert.h"
47
48#include <iprt/mem.h>
49#include <iprt/utf16.h>
50#include <iprt/cpp/ministring.h>
51
52
53/** @defgroup grp_com_str Smart String Classes
54 * @ingroup grp_com
55 * @{
56 */
57
58namespace com
59{
60
61class Utf8Str;
62
63// global constant in glue/string.cpp that represents an empty BSTR
64extern const BSTR g_bstrEmpty;
65
66/**
67 * String class used universally in Main for COM-style Utf-16 strings.
68 *
69 * Unfortunately COM on Windows uses UTF-16 everywhere, requiring conversions
70 * back and forth since most of VirtualBox and our libraries use UTF-8.
71 *
72 * To make things more obscure, on Windows, a COM-style BSTR is not just a
73 * pointer to a null-terminated wide character array, but the four bytes (32
74 * bits) BEFORE the memory that the pointer points to are a length DWORD. One
75 * must therefore avoid pointer arithmetic and always use SysAllocString and
76 * the like to deal with BSTR pointers, which manage that DWORD correctly.
77 *
78 * For platforms other than Windows, we provide our own versions of the Sys*
79 * functions in Main/xpcom/helpers.cpp which do NOT use length prefixes though
80 * to be compatible with how XPCOM allocates string parameters to public
81 * functions.
82 *
83 * The Bstr class hides all this handling behind a std::string-like interface
84 * and also provides automatic conversions to RTCString and Utf8Str instances.
85 *
86 * The one advantage of using the SysString* routines is that this makes it
87 * possible to use it as a type of member variables of COM/XPCOM components and
88 * pass their values to callers through component methods' output parameters
89 * using the #cloneTo() operation. Also, the class can adopt (take ownership
90 * of) string buffers returned in output parameters of COM methods using the
91 * #asOutParam() operation and correctly free them afterwards.
92 *
93 * Starting with VirtualBox 3.2, like Utf8Str, Bstr no longer differentiates
94 * between NULL strings and empty strings. In other words, Bstr("") and
95 * Bstr(NULL) behave the same. In both cases, Bstr allocates no memory,
96 * reports a zero length and zero allocated bytes for both, and returns an
97 * empty C wide string from raw().
98 *
99 * @note All Bstr methods ASSUME valid UTF-16 or UTF-8 input strings.
100 * The VirtualBox policy in this regard is to validate strings coming
101 * from external sources before passing them to Bstr or Utf8Str.
102 */
103class Bstr
104{
105public:
106 /** Creates an empty string; no memory is allocated (m_bstr is NULL). */
107 Bstr()
108 : m_bstr(NULL)
109 { }
110 /** Copy constructor: duplicates the string held by @a that. */
111 Bstr(const Bstr &that)
112 {
113 copyFrom((const OLECHAR *)that.m_bstr);
114 }
115 /** Creates a copy of the zero-terminated UTF-16 string @a that (NULL or "" gives an empty object). */
116 Bstr(CBSTR that)
117 {
118 copyFrom((const OLECHAR *)that);
119 }
120 /* XPCOM only: wchar_t input is reinterpreted as OLECHAR, hence the compile-time size check below. */
121#if defined(VBOX_WITH_XPCOM)
122 Bstr(const wchar_t *that)
123 {
124 AssertCompile(sizeof(wchar_t) == sizeof(OLECHAR));
125 copyFrom((const OLECHAR *)that);
126 }
127#endif
128 /** Creates a UTF-16 copy of the C string held by the RTCString @a that. */
129 Bstr(const RTCString &that)
130 {
131 copyFrom(that.c_str());
132 }
133 /** Creates a UTF-16 copy of the zero-terminated UTF-8 string @a that. */
134 Bstr(const char *that)
135 {
136 copyFrom(that);
137 }
138 /** Sub-string variant: converts at most @a a_cchMax chars (not codepoints) of @a a_pThat. */
139 Bstr(const char *a_pThat, size_t a_cchMax)
140 {
141 copyFromN(a_pThat, a_cchMax);
142 }
143
144 ~Bstr()
145 {
146 setNull();
147 }
148 /** Copy assignment. Assigning an object to itself leaves it unchanged. */
149 Bstr &operator=(const Bstr &that)
150 {
151 if (this != &that) /* cleanup() would otherwise free the very buffer we are about to copy */
152 { cleanup(); copyFrom((const OLECHAR *)that.m_bstr); }
153 return *this;
154 }
155 /** Assigns a copy of the UTF-16 string @a that; passing this object's own buffer is a no-op. */
156 Bstr &operator=(CBSTR that)
157 {
158 if (that != (CBSTR)m_bstr) /* same buffer: freeing it first would leave 'that' dangling */
159 { cleanup(); copyFrom((const OLECHAR *)that); }
160 return *this;
161 }
162 /* XPCOM only: wchar_t flavour of the CBSTR assignment, with the same own-buffer guard. */
163#if defined(VBOX_WITH_XPCOM)
164 Bstr &operator=(const wchar_t *that)
165 {
166 if ((const OLECHAR *)that != (const OLECHAR *)m_bstr)
167 { cleanup(); copyFrom((const OLECHAR *)that); }
168 return *this;
169 }
170#endif
171
172 Bstr &setNull()
173 {
174 cleanup();
175 return *this;
176 }
177
178#ifdef _MSC_VER
179# if _MSC_VER >= 1400
180 RTMEMEF_NEW_AND_DELETE_OPERATORS();
181# endif
182#else
183 RTMEMEF_NEW_AND_DELETE_OPERATORS();
184#endif
185
186 /** Case sensitivity selector. */
187 enum CaseSensitivity
188 {
189 CaseSensitive,
190 CaseInsensitive
191 };
192
193 /**
194 * Compares the member string to @a str.
195 * @param str The UTF-16 string to compare with.
196 * @param cs Whether comparison should be case-sensitive.
197 * @return 0 if equal, negative if this string sorts before @a str, positive otherwise.
198 */
199 int compare(CBSTR str, CaseSensitivity cs = CaseSensitive) const
200 {
201 PRTUTF16 const pwszLeft = (PRTUTF16)m_bstr;
202 PRTUTF16 const pwszRight = (PRTUTF16)str;
203 return cs == CaseSensitive ? ::RTUtf16Cmp(pwszLeft, pwszRight) : ::RTUtf16LocaleICmp(pwszLeft, pwszRight);
204 }
205
206 int compare(BSTR str, CaseSensitivity cs = CaseSensitive) const
207 {
208 return compare((CBSTR)str, cs);
209 }
210
211 int compare(const Bstr &that, CaseSensitivity cs = CaseSensitive) const
212 {
213 return compare(that.m_bstr, cs);
214 }
215
216 bool operator==(const Bstr &that) const { return !compare(that.m_bstr); }
217 bool operator==(CBSTR that) const { return !compare(that); }
218 bool operator==(BSTR that) const { return !compare(that); }
219 bool operator!=(const Bstr &that) const { return !!compare(that.m_bstr); }
220 bool operator!=(CBSTR that) const { return !!compare(that); }
221 bool operator!=(BSTR that) const { return !!compare(that); }
222 bool operator<(const Bstr &that) const { return compare(that.m_bstr) < 0; }
223 bool operator<(CBSTR that) const { return compare(that) < 0; }
224 bool operator<(BSTR that) const { return compare(that) < 0; }
225 bool operator<=(const Bstr &that) const { return compare(that.m_bstr) <= 0; }
226 bool operator<=(CBSTR that) const { return compare(that) <= 0; }
227 bool operator<=(BSTR that) const { return compare(that) <= 0; }
228 bool operator>(const Bstr &that) const { return compare(that.m_bstr) > 0; }
229 bool operator>(CBSTR that) const { return compare(that) > 0; }
230 bool operator>(BSTR that) const { return compare(that) > 0; }
231 bool operator>=(const Bstr &that) const { return compare(that.m_bstr) >= 0; }
232 bool operator>=(CBSTR that) const { return compare(that) >= 0; }
233 bool operator>=(BSTR that) const { return compare(that) >= 0; }
234
235 /**
236 * Compares this string to an UTF-8 C style string.
237 *
238 * @retval 0 if equal
239 * @retval -1 if this string is smaller than the UTF-8 one.
240 * @retval 1 if the UTF-8 string is smaller than this.
241 *
242 * @param a_pszRight The string to compare with.
243 * @param a_enmCase Whether comparison should be case-sensitive.
244 */
245 int compareUtf8(const char *a_pszRight, CaseSensitivity a_enmCase = CaseSensitive) const;
246
247 /** Java style compare method.
248 * @returns true if @a a_pszRight equals this string.
249 * @param a_pszRight The (UTF-8) string to compare with. */
250 bool equals(const char *a_pszRight) const { return compareUtf8(a_pszRight, CaseSensitive) == 0; }
251
252 /** Java style case-insensitive compare method.
253 * @returns true if @a a_pszRight equals this string.
254 * @param a_pszRight The (UTF-8) string to compare with. */
255 bool equalsIgnoreCase(const char *a_pszRight) const { return compareUtf8(a_pszRight, CaseInsensitive) == 0; }
256
257 /** Java style compare method.
258 * @returns true if @a a_rThat equals this string.
259 * @param a_rThat The other Bstr instance to compare with. */
260 bool equals(const Bstr &a_rThat) const { return compare(a_rThat.m_bstr, CaseSensitive) == 0; }
261 /** Java style case-insensitive compare method.
262 * @returns true if @a a_rThat equals this string.
263 * @param a_rThat The other Bstr instance to compare with. */
264 bool equalsIgnoreCase(const Bstr &a_rThat) const { return compare(a_rThat.m_bstr, CaseInsensitive) == 0; }
265
266 /** Java style compare method.
267 * @returns true if @a a_pThat equals this string.
268 * @param a_pThat The native const BSTR to compare with. */
269 bool equals(CBSTR a_pThat) const { return compare(a_pThat, CaseSensitive) == 0; }
270 /** Java style case-insensitive compare method.
271 * @returns true if @a a_pThat equals this string.
272 * @param a_pThat The native const BSTR to compare with. */
273 bool equalsIgnoreCase(CBSTR a_pThat) const { return compare(a_pThat, CaseInsensitive) == 0; }
274
275 /** Java style compare method.
276 * @returns true if @a a_pThat equals this string.
277 * @param a_pThat The native BSTR to compare with. */
278 bool equals(BSTR a_pThat) const { return compare(a_pThat, CaseSensitive) == 0; }
279 /** Java style case-insensitive compare method.
280 * @returns true if @a a_pThat equals this string.
281 * @param a_pThat The native BSTR to compare with. */
282 bool equalsIgnoreCase(BSTR a_pThat) const { return compare(a_pThat, CaseInsensitive) == 0; }
283
284 /**
285 * Returns true if the member string has no length.
286 * This is true for instances created from both NULL and "" input strings.
287 *
288 * @note Always use this method to check if an instance is empty. Do not
289 * use length() because that may need to run through the entire string
290 * (Bstr does not cache string lengths).
291 */
292 bool isEmpty() const { return m_bstr == NULL || *m_bstr == 0; }
293
294 /**
295 * Returns true if the member string has a length of one or more.
296 *
297 * @returns true if not empty, false if empty (NULL or "").
298 */
299 bool isNotEmpty() const { return m_bstr != NULL && *m_bstr != 0; }
300
301 size_t length() const { return isEmpty() ? 0 : ::RTUtf16Len((PRTUTF16)m_bstr); }
302
303 /**
304 * Assigns the output of the string format operation (RTStrPrintf).
305 *
306 * @param pszFormat Pointer to the format string,
307 * @see pg_rt_str_format.
308 * @param ... Ellipsis containing the arguments specified by
309 * the format string.
310 *
311 * @throws std::bad_alloc On allocation error. Object state is undefined.
312 *
313 * @returns Reference to the object.
314 */
315 Bstr &printf(const char *pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2);
316
317 /**
318 * Assigns the output of the string format operation (RTStrPrintf).
319 *
320 * @param pszFormat Pointer to the format string,
321 * @see pg_rt_str_format.
322 * @param ... Ellipsis containing the arguments specified by
323 * the format string.
324 *
325 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
326 */
327 HRESULT printfNoThrow(const char *pszFormat, ...) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 2);
328
329 /**
330 * Assigns the output of the string format operation (RTStrPrintfV).
331 *
332 * @param pszFormat Pointer to the format string,
333 * @see pg_rt_str_format.
334 * @param va Argument vector containing the arguments
335 * specified by the format string.
336 *
337 * @throws std::bad_alloc On allocation error. Object state is undefined.
338 *
339 * @returns Reference to the object.
340 */
341 Bstr &printfV(const char *pszFormat, va_list va) RT_IPRT_FORMAT_ATTR(1, 0);
342
343 /**
344 * Assigns the output of the string format operation (RTStrPrintfV).
345 *
346 * @param pszFormat Pointer to the format string,
347 * @see pg_rt_str_format.
348 * @param va Argument vector containing the arguments
349 * specified by the format string.
350 *
351 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
352 */
353 HRESULT printfVNoThrow(const char *pszFormat, va_list va) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 0);
354
355 /** @name Append methods and operators
356 * @{ */
357
358 /**
359 * Appends the string @a rThat to @a this.
360 *
361 * @param rThat The string to append.
362 * @throws std::bad_alloc On allocation error. The object is left unchanged.
363 * @returns Reference to the object.
364 */
365 Bstr &append(const Bstr &rThat);
366
367 /**
368 * Appends the string @a rThat to @a this.
369 *
370 * @param rThat The string to append.
371 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
372 */
373 HRESULT appendNoThrow(const Bstr &rThat) RT_NOEXCEPT;
374
375 /**
376 * Appends the UTF-8 string @a rThat to @a this.
377 *
378 * @param rThat The string to append.
379 * @throws std::bad_alloc On allocation error. The object is left unchanged.
380 * @returns Reference to the object.
381 */
382 Bstr &append(const RTCString &rThat);
383
384 /**
385 * Appends the UTF-8 string @a rThat to @a this.
386 *
387 * @param rThat The string to append.
388 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
389 */
390 HRESULT appendNoThrow(const RTCString &rThat) RT_NOEXCEPT;
391
392 /**
393 * Appends the UTF-16 string @a pwszSrc to @a this.
394 *
395 * @param pwszSrc The C-style UTF-16 string to append.
396 * @throws std::bad_alloc On allocation error. The object is left unchanged.
397 * @returns Reference to the object.
398 */
399 Bstr &append(CBSTR pwszSrc);
400
401 /**
402 * Appends the UTF-16 string @a pwszSrc to @a this.
403 *
404 * @param pwszSrc The C-style UTF-16 string to append.
405 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
406 */
407 HRESULT appendNoThrow(CBSTR pwszSrc) RT_NOEXCEPT;
408
409 /**
410 * Appends the UTF-8 string @a pszSrc to @a this.
411 *
412 * @param pszSrc The C-style string to append.
413 * @throws std::bad_alloc On allocation error. The object is left unchanged.
414 * @returns Reference to the object.
415 */
416 Bstr &append(const char *pszSrc);
417
418 /**
419 * Appends the UTF-8 string @a pszSrc to @a this.
420 *
421 * @param pszSrc The C-style string to append.
422 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
423 */
424 HRESULT appendNoThrow(const char *pszSrc) RT_NOEXCEPT;
425
426 /**
427 * Appends a substring from @a rThat to @a this.
428 *
429 * @param rThat The string to append a substring from.
430 * @param offStart The start of the substring to append (UTF-16
431 * offset, not codepoint).
432 * @param cwcMax The maximum number of UTF-16 units to append.
433 * @throws std::bad_alloc On allocation error. The object is left unchanged.
434 * @returns Reference to the object.
435 */
436 Bstr &append(const Bstr &rThat, size_t offStart, size_t cwcMax = RTSTR_MAX);
437
438 /**
439 * Appends a substring from @a rThat to @a this.
440 *
441 * @param rThat The string to append a substring from.
442 * @param offStart The start of the substring to append (UTF-16
443 * offset, not codepoint).
444 * @param cwcMax The maximum number of UTF-16 units to append.
445 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
446 */
447 HRESULT appendNoThrow(const Bstr &rThat, size_t offStart, size_t cwcMax = RTSTR_MAX) RT_NOEXCEPT;
448
449 /**
450 * Appends a substring from UTF-8 @a rThat to @a this.
451 *
452 * @param rThat The string to append a substring from.
453 * @param offStart The start of the substring to append (byte offset,
454 * not codepoint).
455 * @param cchMax The maximum number of bytes to append.
456 * @throws std::bad_alloc On allocation error. The object is left unchanged.
457 * @returns Reference to the object.
458 */
459 Bstr &append(const RTCString &rThat, size_t offStart, size_t cchMax = RTSTR_MAX);
460
461 /**
462 * Appends a substring from UTF-8 @a rThat to @a this.
463 *
464 * @param rThat The string to append a substring from.
465 * @param offStart The start of the substring to append (byte offset,
466 * not codepoint).
467 * @param cchMax The maximum number of bytes to append.
468 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
469 */
470 HRESULT appendNoThrow(const RTCString &rThat, size_t offStart, size_t cchMax = RTSTR_MAX) RT_NOEXCEPT;
471
472 /**
473 * Appends the first @a cchMax chars from UTF-16 string @a pwszThat to @a this.
474 *
475 * @param pwszThat The C-style UTF-16 string to append.
476 * @param cchMax The maximum number of bytes to append.
477 * @throws std::bad_alloc On allocation error. The object is left unchanged.
478 * @returns Reference to the object.
479 */
480 Bstr &append(CBSTR pwszThat, size_t cchMax);
481
482 /**
483 * Appends the first @a cchMax chars from UTF-16 string @a pwszThat to @a this.
484 *
485 * @param pwszThat The C-style UTF-16 string to append.
486 * @param cchMax The maximum number of bytes to append.
487 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
488 */
489 HRESULT appendNoThrow(CBSTR pwszThat, size_t cchMax) RT_NOEXCEPT;
490
491 /**
492 * Appends the first @a cchMax chars from string @a pszThat to @a this.
493 *
494 * @param pszThat The C-style string to append.
495 * @param cchMax The maximum number of bytes to append.
496 * @throws std::bad_alloc On allocation error. The object is left unchanged.
497 * @returns Reference to the object.
498 */
499 Bstr &append(const char *pszThat, size_t cchMax);
500
501 /**
502 * Appends the first @a cchMax chars from string @a pszThat to @a this.
503 *
504 * @param pszThat The C-style string to append.
505 * @param cchMax The maximum number of bytes to append.
506 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
507 */
508 HRESULT appendNoThrow(const char *pszThat, size_t cchMax) RT_NOEXCEPT;
509
510 /**
511 * Appends the given character to @a this.
512 *
513 * @param ch The character to append.
514 * @throws std::bad_alloc On allocation error. The object is left unchanged.
515 * @returns Reference to the object.
516 */
517 Bstr &append(char ch);
518
519 /**
520 * Appends the given character to @a this.
521 *
522 * @param ch The character to append.
523 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
524 */
525 HRESULT appendNoThrow(char ch) RT_NOEXCEPT;
526
527 /**
528 * Appends the given unicode code point to @a this.
529 *
530 * @param uc The unicode code point to append.
531 * @throws std::bad_alloc On allocation error. The object is left unchanged.
532 * @returns Reference to the object.
533 */
534 Bstr &appendCodePoint(RTUNICP uc);
535
536 /**
537 * Appends the given unicode code point to @a this.
538 *
539 * @param uc The unicode code point to append.
540 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
541 */
542 HRESULT appendCodePointNoThrow(RTUNICP uc) RT_NOEXCEPT;
543
544 /**
545 * Appends the output of the string format operation (RTStrPrintf).
546 *
547 * @param pszFormat Pointer to the format string,
548 * @see pg_rt_str_format.
549 * @param ... Ellipsis containing the arguments specified by
550 * the format string.
551 *
552 * @throws std::bad_alloc On allocation error. Object state is undefined.
553 *
554 * @returns Reference to the object.
555 */
556 Bstr &appendPrintf(const char *pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2);
557
558 /**
559 * Appends the output of the string format operation (RTStrPrintf).
560 *
561 * @param pszFormat Pointer to the format string,
562 * @see pg_rt_str_format.
563 * @param ... Ellipsis containing the arguments specified by
564 * the format string.
565 *
566 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
567 */
568 HRESULT appendPrintfNoThrow(const char *pszFormat, ...) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 2);
569
570 /**
571 * Appends the output of the string format operation (RTStrPrintfV).
572 *
573 * @param pszFormat Pointer to the format string,
574 * @see pg_rt_str_format.
575 * @param va Argument vector containing the arguments
576 * specified by the format string.
577 *
578 * @throws std::bad_alloc On allocation error. Object state is undefined.
579 *
580 * @returns Reference to the object.
581 */
582 Bstr &appendPrintfV(const char *pszFormat, va_list va) RT_IPRT_FORMAT_ATTR(1, 0);
583
584 /**
585 * Appends the output of the string format operation (RTStrPrintfV).
586 *
587 * @param pszFormat Pointer to the format string,
588 * @see pg_rt_str_format.
589 * @param va Argument vector containing the arguments
590 * specified by the format string.
591 *
592 * @returns S_OK, E_OUTOFMEMORY or E_INVAL (bad encoding).
593 */
594 HRESULT appendPrintfVNoThrow(const char *pszFormat, va_list va) RT_NOEXCEPT RT_IPRT_FORMAT_ATTR(1, 0);
595
596 /**
597 * Shortcut to append(), Bstr variant.
598 *
599 * @param rThat The string to append.
600 * @returns Reference to the object.
601 */
602 Bstr &operator+=(const Bstr &rThat)
603 {
604 return append(rThat);
605 }
606
607 /**
608 * Shortcut to append(), RTCString variant.
609 *
610 * @param rThat The string to append.
611 * @returns Reference to the object.
612 */
613 Bstr &operator+=(const RTCString &rThat)
614 {
615 return append(rThat);
616 }
617
618 /**
619 * Shortcut to append(), CBSTR variant.
620 *
621 * @param pwszThat The C-style string to append.
622 * @returns Reference to the object.
623 */
624 Bstr &operator+=(CBSTR pwszThat)
625 {
626 return append(pwszThat);
627 }
628
629 /**
630 * Shortcut to append(), const char * variant.
631 *
632 * @param pszThat The C-style string to append.
633 * @returns Reference to the object.
634 */
635 Bstr &operator+=(const char *pszThat)
636 {
637 return append(pszThat);
638 }
639
640#if 0
641 /**
642 * Shortcut to append(), char variant.
643 *
644 * @param ch The character to append.
645 *
646 * @returns Reference to the object.
647 */
648 Bstr &operator+=(char ch)
649 {
650 return append(ch);
651 }
652#endif
653
654 /** @} */
655
656#if defined(VBOX_WITH_XPCOM)
657 /**
658 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
659 * returns a pointer to a global variable containing an empty BSTR with a proper zero
660 * length prefix so that Windows is happy.
661 */
662 CBSTR raw() const
663 {
664 if (m_bstr)
665 return m_bstr;
666
667 return g_bstrEmpty;
668 }
669#else
670 /**
671 * Windows-only hack, as the automatically generated headers use BSTR.
672 * So if we don't want to cast like crazy we have to be more loose than
673 * on XPCOM.
674 *
675 * Returns a pointer to the raw member UTF-16 string. If the member string is empty,
676 * returns a pointer to a global variable containing an empty BSTR with a proper zero
677 * length prefix so that Windows is happy.
678 */
679 BSTR raw() const
680 {
681 if (m_bstr)
682 return m_bstr;
683
684 return g_bstrEmpty;
685 }
686#endif
687
688 /**
689 * Returns a non-const raw pointer that allows modifying the string directly.
690 *
691 * @note As opposed to raw(), this DOES return NULL if the member string is
692 * empty because we cannot return a mutable pointer to the global variable
693 * with the empty string.
694 *
695 * @note If modifying the string size (only shrinking it is allowed), #jolt() or
696 * #joltNoThrow() must be called!
697 *
698 * @note Do not modify memory beyond the #length() of the string!
699 *
700 * @sa jolt(), joltNoThrow(), reserve(), reserveNoThrow()
701 */
702 BSTR mutableRaw() { return m_bstr; }
703
704 /**
705 * Correct the embedded length after using mutableRaw().
706 *
707 * This is needed on COM (Windows) to update the embedded string length. It is
708 * a stub on hosts using XPCOM.
709 *
710 * @param cwcNew The new string length, if handy, otherwise a negative
711 * number.
712 * @sa joltNoThrow(), mutableRaw(), reserve(), reserveNoThrow()
713 */
714#ifndef VBOX_WITH_XPCOM
715 void jolt(ssize_t cwcNew = -1);
716#else
717 void jolt(ssize_t cwcNew = -1)
718 {
719 Assert(cwcNew < 0 || (cwcNew == 0 && !m_bstr) || m_bstr[cwcNew] == '\0'); RT_NOREF(cwcNew);
720 }
721#endif
722
723 /**
724 * Correct the embedded length after using mutableRaw().
725 *
726 * This is needed on COM (Windows) to update the embedded string length. It is
727 * a stub on hosts using XPCOM.
728 *
729 * @returns S_OK on success, E_OUTOFMEMORY if shrinking the string failed.
730 * @param cwcNew The new string length, if handy, otherwise a negative
731 * number.
732 * @sa jolt(), mutableRaw(), reserve(), reserveNoThrow()
733 */
734#ifndef VBOX_WITH_XPCOM
735 HRESULT joltNoThrow(ssize_t cwcNew = -1) RT_NOEXCEPT;
736#else
737 HRESULT joltNoThrow(ssize_t cwcNew = -1) RT_NOEXCEPT
738 {
739 Assert(cwcNew < 0 || (cwcNew == 0 && !m_bstr) || m_bstr[cwcNew] == '\0'); RT_NOREF(cwcNew);
740 return S_OK;
741 }
742#endif
743
744 /**
745 * Make sure that at least @a cwcMin UTF-16 units of buffer space are reserved.
746 *
747 * Requests that the contained memory buffer can hold at least @a cwcMin UTF-16
748 * units. This may expand or shrink the string's storage, but will never
749 * truncate the contained string. In other words, @a cwcMin will be ignored if
750 * it is too small to hold the current string.
751 *
752 * @param cwcMin The new minimum string length that can be stored. This
753 * does not include the terminator.
754 * @param fForce Force this size.
755 *
756 * @throws std::bad_alloc On allocation error. The object is left unchanged.
757 */
758 void reserve(size_t cwcMin, bool fForce = false);
759
760 /**
761 * A C like version of the #reserve() method, i.e. return code instead of throw.
762 *
763 * @returns S_OK or E_OUTOFMEMORY.
764 * @param cwcMin The new minimum string length that can be stored. This
765 * does not include the terminator.
766 * @param fForce Force this size.
767 */
768 HRESULT reserveNoThrow(size_t cwcMin, bool fForce = false) RT_NOEXCEPT;
769
770 /**
771 * Intended to assign copies of instances to |BSTR| out parameters from
772 * within the interface method. Transfers the ownership of the duplicated
773 * string to the caller.
774 *
775 * If the member string is empty, this allocates an empty BSTR in *pstr
776 * (i.e. makes it point to a new buffer with a null byte).
777 *
778 * @deprecated Use cloneToEx instead to avoid throwing exceptions.
779 */
780 void cloneTo(BSTR *pstr) const
781 {
782 /* Without a destination there is nothing to clone into. */
783 if (!pstr)
784 return;
785 *pstr = ::SysAllocString((const OLECHAR *)raw()); // raw() never yields NULL, so an empty string clones as ""
786#ifdef RT_EXCEPTIONS_ENABLED
787 if (*pstr == NULL)
788 throw std::bad_alloc();
789#endif
790 }
791
792 /**
793 * A version of cloneTo() that reports allocation failure through the return
794 * code instead of throwing. A NULL @a pstr is accepted and treated as a no-op.
795 * @returns S_OK, or E_OUTOFMEMORY if the copy could not be allocated.
796 */
797 HRESULT cloneToEx(BSTR *pstr) const
798 {
799 if (!pstr)
800 return S_OK;
801 *pstr = ::SysAllocString((const OLECHAR *)raw()); // raw() returns a pointer to "" if empty
802 return *pstr ? S_OK : E_OUTOFMEMORY; /* test the allocation result, not the (non-NULL) out pointer */
803 }
804
805 /**
806 * Intended to assign instances to |BSTR| out parameters from within the
807 * interface method. Transfers the ownership of the original string to the
808 * caller and resets the instance to null.
809 *
810 * As opposed to cloneTo(), this method doesn't create a copy of the
811 * string.
812 *
813 * If the member string is empty, this allocates an empty BSTR in *pstr
814 * (i.e. makes it point to a new buffer with a null byte).
815 *
816 * @param pbstrDst The BSTR variable to detach the string to.
817 *
818 * @throws std::bad_alloc if we failed to allocate a new empty string.
819 */
820 void detachTo(BSTR *pbstrDst)
821 {
822 if (m_bstr != NULL)
823 {
824 /* Ownership of our buffer moves to the caller; this object becomes empty. */
825 *pbstrDst = m_bstr;
826 m_bstr = NULL;
827 return;
828 }
829
830 /* Nothing to hand over, so give the caller a freshly allocated empty BSTR. */
831 *pbstrDst = ::SysAllocString((const OLECHAR *)g_bstrEmpty);
832#ifdef RT_EXCEPTIONS_ENABLED
833 if (*pbstrDst == NULL)
834 throw std::bad_alloc();
835#endif
836 }
837
838 /**
839 * A version of detachTo that does not throw exceptions on out-of-memory
840 * conditions, but instead returns E_OUTOFMEMORY.
841 *
842 * @param pbstrDst The BSTR variable to detach the string to.
843 * @returns S_OK or E_OUTOFMEMORY.
844 */
845 HRESULT detachToEx(BSTR *pbstrDst)
846 {
847 if (m_bstr != NULL)
848 {
849 /* Ownership of our buffer moves to the caller; this object becomes empty. */
850 *pbstrDst = m_bstr;
851 m_bstr = NULL;
852 return S_OK;
853 }
854
855 /* Nothing to hand over, so give the caller a freshly allocated empty BSTR. */
856 *pbstrDst = ::SysAllocString((const OLECHAR *)g_bstrEmpty);
857 if (*pbstrDst != NULL)
858 return S_OK;
859 return E_OUTOFMEMORY;
860 }
861
862 /**
863 * Intended to pass instances as |BSTR| out parameters to methods.
864 * Takes the ownership of the returned data.
865 */
866 BSTR *asOutParam()
867 {
868 cleanup();
869 return &m_bstr;
870 }
871
872 /**
873 * Static immutable empty-string object. May be used for comparison purposes.
874 */
875 static const Bstr Empty;
876
877protected:
878
879 void cleanup()
880 {
881 if (m_bstr == NULL)
882 return; /* already empty, nothing to release */
883
884 ::SysFreeString(m_bstr);
885 m_bstr = NULL; /* do not keep a pointer to the freed buffer */
886 }
887
888 /**
889 * Internal helper that (re)initialises m_bstr from a UTF-16 string. The old
890 * value of m_bstr is overwritten without being freed, so this is only safe in
891 * a constructor or directly after cleanup().
892 *
893 * The source must be zero-terminated but need not be a real BSTR (no length
894 * prefix is required). A NULL or empty source results in m_bstr being NULL.
895 *
896 * @param a_bstrSrc The source string. The caller guarantees
897 * that this is valid UTF-16.
898 *
899 * @throws std::bad_alloc on allocation failure (only if exceptions are enabled);
900 * m_bstr is NULL then, i.e. the object represents an empty string.
901 */
902 void copyFrom(const OLECHAR *a_bstrSrc)
903 {
904 if (a_bstrSrc == NULL || *a_bstrSrc == 0)
905 {
906 m_bstr = NULL; /* NULL and "" sources are both stored as NULL */
907 return;
908 }
909 m_bstr = ::SysAllocString(a_bstrSrc);
910#ifdef RT_EXCEPTIONS_ENABLED
911 if (m_bstr == NULL)
912 throw std::bad_alloc();
913#endif
914 }
915
916 /**
917 * Protected internal helper to copy a string. This ignores the previous object
918 * state, so either call this from a constructor or call cleanup() first.
919 *
920 * This variant copies and converts from a zero-terminated UTF-8 string.
921 *
922 * If the source is empty, this sets the member string to NULL.
923 *
924 * @param a_pszSrc The source string. The caller guarantees
925 * that this is valid UTF-8.
926 *
927 * @throws std::bad_alloc - the object is representing an empty string.
928 */
929 void copyFrom(const char *a_pszSrc)
930 {
931 copyFromN(a_pszSrc, RTSTR_MAX);
932 }
933
934 /**
935 * Variant of copyFrom for sub-string constructors.
936 *
937 * @param a_pszSrc The source string. The caller guarantees
938 * that this is valid UTF-8.
939 * @param a_cchSrc The maximum number of chars (not codepoints) to
940 * copy. If you pass RTSTR_MAX it'll be exactly
941 * like copyFrom().
942 *
943 * @throws std::bad_alloc - the object is representing an empty string.
944 */
945 void copyFromN(const char *a_pszSrc, size_t a_cchSrc);
946
947 Bstr &appendWorkerUtf16(PCRTUTF16 pwszSrc, size_t cwcSrc);
948 Bstr &appendWorkerUtf8(const char *pszSrc, size_t cchSrc);
949 HRESULT appendWorkerUtf16NoThrow(PCRTUTF16 pwszSrc, size_t cwcSrc) RT_NOEXCEPT;
950 HRESULT appendWorkerUtf8NoThrow(const char *pszSrc, size_t cchSrc) RT_NOEXCEPT;
951
952 static DECLCALLBACK(size_t) printfOutputCallbackNoThrow(void *pvArg, const char *pachChars, size_t cbChars) RT_NOEXCEPT;
953
954 BSTR m_bstr;
955
956 friend class Utf8Str; /* to access our raw_copy() */
957};
958
959/* symmetric compare operators */
960inline bool operator==(CBSTR l, const Bstr &r) { return r.operator==(l); }
961inline bool operator!=(CBSTR l, const Bstr &r) { return r.operator!=(l); }
962inline bool operator==(BSTR l, const Bstr &r) { return r.operator==(l); }
963inline bool operator!=(BSTR l, const Bstr &r) { return r.operator!=(l); }
964
965
966
967
968/**
969 * String class used universally in Main for UTF-8 strings.
970 *
971 * This is based on RTCString, to which some functionality has been
972 * moved. Here we keep things that are specific to Main, such as conversions
973 * with UTF-16 strings (Bstr).
974 *
975 * Like RTCString, Utf8Str does not differentiate between NULL strings
976 * and empty strings. In other words, Utf8Str("") and Utf8Str(NULL) behave the
977 * same. In both cases, RTCString allocates no memory, reports
978 * a zero length and zero allocated bytes for both, and returns an empty
979 * C string from c_str().
980 *
981 * @note All Utf8Str methods ASSUMES valid UTF-8 or UTF-16 input strings.
982 * The VirtualBox policy in this regard is to validate strings coming
983 * from external sources before passing them to Utf8Str or Bstr.
984 */
985class Utf8Str : public RTCString
986{
987public:
988
989 Utf8Str() {}
990
991 Utf8Str(const RTCString &that)
992 : RTCString(that)
993 {}
994
995 Utf8Str(const char *that)
996 : RTCString(that)
997 {}
998
999 Utf8Str(const Bstr &that)
1000 {
1001 copyFrom(that.raw());
1002 }
1003
1004 Utf8Str(CBSTR that, size_t a_cwcSize = RTSTR_MAX)
1005 {
1006 copyFrom(that, a_cwcSize);
1007 }
1008
1009 Utf8Str(const char *a_pszSrc, size_t a_cchSrc)
1010 : RTCString(a_pszSrc, a_cchSrc)
1011 {
1012 }
1013
1014 /**
1015 * Constructs a new string given the format string and the list of the
1016 * arguments for the format string.
1017 *
1018 * @param a_pszFormat Pointer to the format string (UTF-8),
1019 * @see pg_rt_str_format.
1020 * @param a_va Argument vector containing the arguments
1021 * specified by the format string.
1022 * @sa RTCString::printfV
1023 */
1024 Utf8Str(const char *a_pszFormat, va_list a_va) RT_IPRT_FORMAT_ATTR(1, 0)
1025 : RTCString(a_pszFormat, a_va)
1026 {
1027 }
1028
1029 Utf8Str& operator=(const RTCString &that)
1030 {
1031 RTCString::operator=(that);
1032 return *this;
1033 }
1034
1035 Utf8Str& operator=(const char *that)
1036 {
1037 RTCString::operator=(that);
1038 return *this;
1039 }
1040
1041 Utf8Str& operator=(const Bstr &that)
1042 {
1043 cleanup();
1044 copyFrom(that.raw());
1045 return *this;
1046 }
1047
1048 Utf8Str& operator=(CBSTR that)
1049 {
1050 cleanup();
1051 copyFrom(that);
1052 return *this;
1053 }
1054
1055 /**
1056 * Extended assignment method that returns a COM status code instead of an
1057 * exception on failure.
1058 *
1059 * @returns S_OK or E_OUTOFMEMORY.
1060 * @param a_rSrcStr The source string
1061 */
1062 HRESULT assignEx(Utf8Str const &a_rSrcStr)
1063 {
1064 return copyFromExNComRC(a_rSrcStr.m_psz, 0, a_rSrcStr.m_cch);
1065 }
1066
1067 /**
1068 * Extended assignment method that returns a COM status code instead of an
1069 * exception on failure.
1070 *
1071 * @returns S_OK, E_OUTOFMEMORY or E_INVALIDARG.
1072 * @param a_rSrcStr The source string
1073 * @param a_offSrc The character (byte) offset of the substring.
1074 * @param a_cchSrc The number of characters (bytes) to copy from the source
1075 * string.
1076 */
1077 HRESULT assignEx(Utf8Str const &a_rSrcStr, size_t a_offSrc, size_t a_cchSrc)
1078 {
1079 if ( a_offSrc + a_cchSrc > a_rSrcStr.m_cch
1080 || a_offSrc > a_rSrcStr.m_cch)
1081 return E_INVALIDARG;
1082 return copyFromExNComRC(a_rSrcStr.m_psz, a_offSrc, a_cchSrc);
1083 }
1084
1085 /**
1086 * Extended assignment method that returns a COM status code instead of an
1087 * exception on failure.
1088 *
1089 * @returns S_OK or E_OUTOFMEMORY.
1090 * @param a_pcszSrc The source string
1091 */
1092 HRESULT assignEx(const char *a_pcszSrc)
1093 {
1094 return copyFromExNComRC(a_pcszSrc, 0, a_pcszSrc ? strlen(a_pcszSrc) : 0);
1095 }
1096
1097 /**
1098 * Extended assignment method that returns a COM status code instead of an
1099 * exception on failure.
1100 *
1101 * @returns S_OK or E_OUTOFMEMORY.
1102 * @param a_pcszSrc The source string
1103 * @param a_cchSrc The number of characters (bytes) to copy from the source
1104 * string.
1105 */
1106 HRESULT assignEx(const char *a_pcszSrc, size_t a_cchSrc)
1107 {
1108 return copyFromExNComRC(a_pcszSrc, 0, a_cchSrc);
1109 }
1110
1111 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1112
1113#if defined(VBOX_WITH_XPCOM)
1114 /**
1115 * Intended to assign instances to |char *| out parameters from within the
1116 * interface method. Transfers the ownership of the duplicated string to the
1117 * caller.
1118 *
1119 * This allocates a single 0 byte in the target if the member string is empty.
1120 *
1121 * This uses XPCOM memory allocation and thus only works on XPCOM. MSCOM doesn't
1122 * like char* strings anyway.
1123 */
1124 void cloneTo(char **pstr) const;
1125
1126 /**
1127 * A version of cloneTo that does not throw allocation errors but returns
1128 * E_OUTOFMEMORY instead.
1129 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1130 */
1131 HRESULT cloneToEx(char **pstr) const;
1132#endif
1133
1134 /**
1135 * Intended to assign instances to |BSTR| out parameters from within the
1136 * interface method. Transfers the ownership of the duplicated string to the
1137 * caller.
1138 */
1139 void cloneTo(BSTR *pstr) const
1140 {
1141 if (pstr)
1142 {
1143 Bstr bstr(*this);
1144 bstr.cloneTo(pstr);
1145 }
1146 }
1147
1148 /**
1149 * A version of cloneTo that does not throw allocation errors but returns
1150 * E_OUTOFMEMORY instead.
1151 *
1152 * @param pbstr Where to store a clone of the string.
1153 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1154 */
1155 HRESULT cloneToEx(BSTR *pbstr) const
1156 {
1157 if (!pbstr)
1158 return S_OK;
1159 Bstr bstr(*this);
1160 return bstr.detachToEx(pbstr);
1161 }
1162
1163 /**
1164 * Safe assignment from BSTR.
1165 *
1166 * @param pbstrSrc The source string.
1167 * @returns S_OK or E_OUTOFMEMORY (COM status codes).
1168 */
1169 HRESULT cloneEx(CBSTR pbstrSrc)
1170 {
1171 cleanup();
1172 return copyFromEx(pbstrSrc);
1173 }
1174
1175 /**
1176 * Removes a trailing slash from the member string, if present.
1177 * Calls RTPathStripTrailingSlash() without having to mess with mutableRaw().
1178 */
1179 Utf8Str& stripTrailingSlash();
1180
1181 /**
1182 * Removes a trailing filename from the member string, if present.
1183 * Calls RTPathStripFilename() without having to mess with mutableRaw().
1184 */
1185 Utf8Str& stripFilename();
1186
1187 /**
1188 * Removes the path component from the member string, if present.
1189 * Calls RTPathFilename() without having to mess with mutableRaw().
1190 */
1191 Utf8Str& stripPath();
1192
1193 /**
1194 * Removes a trailing file name suffix from the member string, if present.
1195 * Calls RTPathStripSuffix() without having to mess with mutableRaw().
1196 */
1197 Utf8Str& stripSuffix();
1198
1199 /**
1200 * Parses key=value pairs.
1201 *
1202 * @returns offset of the @a a_rPairSeparator following the returned value.
1203 * @retval npos is returned if there are no more key/value pairs.
1204 *
1205 * @param a_rKey Reference to variable that should receive
1206 * the key substring. This is set to null if
1207 * no key/value found. (It's also possible the
1208 * key is an empty string, so be careful.)
1209 * @param a_rValue Reference to variable that should receive
1210 * the value substring. This is set to null if
1211 * no key/value found. (It's also possible the
1212 * value is an empty string, so be careful.)
1213 * @param a_offStart The offset to start searching from. This is
1214 * typically 0 for the first call, and the
1215 * return value of the previous call for the
1216 * subsequent ones.
1217 * @param a_rPairSeparator The pair separator string. If this is an
1218 * empty string, the whole string will be
1219 * considered as a single key/value pair.
1220 * @param a_rKeyValueSeparator The key/value separator string.
1221 */
1222 size_t parseKeyValue(Utf8Str &a_rKey, Utf8Str &a_rValue, size_t a_offStart = 0,
1223 const Utf8Str &a_rPairSeparator = ",", const Utf8Str &a_rKeyValueSeparator = "=") const;
1224
1225 /**
1226 * Static immutable empty-string object. May be used for comparison purposes.
1227 */
1228 static const Utf8Str Empty;
1229protected:
1230
1231 void copyFrom(CBSTR a_pbstr, size_t a_cwcMax = RTSTR_MAX);
1232 HRESULT copyFromEx(CBSTR a_pbstr);
1233 HRESULT copyFromExNComRC(const char *a_pcszSrc, size_t a_offSrc, size_t a_cchSrc);
1234
1235 friend class Bstr; /* to access our raw_copy() */
1236};
1237
1238/**
1239 * Class with RTCString::printf as constructor for your convenience.
1240 *
1241 * Constructing a Utf8Str string object from a format string and a variable
1242 * number of arguments can easily be confused with the other Utf8Str
1243 * constructures, thus this child class.
1244 *
1245 * The usage of this class is like the following:
1246 * @code
1247 Utf8StrFmt strName("program name = %s", argv[0]);
1248 @endcode
1249 */
1250class Utf8StrFmt : public Utf8Str
1251{
1252public:
1253
1254 /**
1255 * Constructs a new string given the format string and the list of the
1256 * arguments for the format string.
1257 *
1258 * @param a_pszFormat Pointer to the format string (UTF-8),
1259 * @see pg_rt_str_format.
1260 * @param ... Ellipsis containing the arguments specified by
1261 * the format string.
1262 */
1263 explicit Utf8StrFmt(const char *a_pszFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2)
1264 {
1265 va_list va;
1266 va_start(va, a_pszFormat);
1267 printfV(a_pszFormat, va);
1268 va_end(va);
1269 }
1270
1271 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1272
1273protected:
1274 Utf8StrFmt()
1275 { }
1276
1277private:
1278};
1279
1280/**
1281 * The BstrFmt class is a shortcut to <tt>Bstr(Utf8StrFmt(...))</tt>.
1282 */
1283class BstrFmt : public Bstr
1284{
1285public:
1286
1287 /**
1288 * Constructs a new string given the format string and the list of the
1289 * arguments for the format string.
1290 *
1291 * @param aFormat printf-like format string (in UTF-8 encoding).
1292 * @param ... List of the arguments for the format string.
1293 */
1294 explicit BstrFmt(const char *aFormat, ...) RT_IPRT_FORMAT_ATTR(1, 2)
1295 {
1296 va_list args;
1297 va_start(args, aFormat);
1298 copyFrom(Utf8Str(aFormat, args).c_str());
1299 va_end(args);
1300 }
1301
1302 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1303};
1304
1305/**
1306 * The BstrFmtVA class is a shortcut to <tt>Bstr(Utf8Str(format,va))</tt>.
1307 */
1308class BstrFmtVA : public Bstr
1309{
1310public:
1311
1312 /**
1313 * Constructs a new string given the format string and the list of the
1314 * arguments for the format string.
1315 *
1316 * @param aFormat printf-like format string (in UTF-8 encoding).
1317 * @param aArgs List of arguments for the format string
1318 */
1319 BstrFmtVA(const char *aFormat, va_list aArgs) RT_IPRT_FORMAT_ATTR(1, 0)
1320 {
1321 copyFrom(Utf8Str(aFormat, aArgs).c_str());
1322 }
1323
1324 RTMEMEF_NEW_AND_DELETE_OPERATORS();
1325};
1326
1327} /* namespace com */
1328
1329/** @} */
1330
1331#endif /* !VBOX_INCLUDED_com_string_h */
1332
Note: See TracBrowser for help on using the repository browser.

© 2025 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette