VirtualBox

source: vbox/trunk/src/VBox/Runtime/common/string/ministring.cpp@ 36561

Last change on this file since 36561 was 36561, checked in by vboxsync, 14 years ago

RTCString::join: Optimization.

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 11.6 KB
Line 
1/* $Id: ministring.cpp 36561 2011-04-05 13:42:59Z vboxsync $ */
2/** @file
3 * IPRT - Mini C++ string class.
4 *
5 * This is a base for both Utf8Str and other places where IPRT may want to use
6 * a lean C++ string class.
7 */
8
9/*
10 * Copyright (C) 2007-2011 Oracle Corporation
11 *
12 * This file is part of VirtualBox Open Source Edition (OSE), as
13 * available from http://www.virtualbox.org. This file is free software;
14 * you can redistribute it and/or modify it under the terms of the GNU
15 * General Public License (GPL) as published by the Free Software
16 * Foundation, in version 2 as it comes in the "COPYING" file of the
17 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
18 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
19 *
20 * The contents of this file may alternatively be used under the terms
21 * of the Common Development and Distribution License Version 1.0
22 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
23 * VirtualBox OSE distribution, in which case the provisions of the
24 * CDDL are applicable instead of those of the GPL.
25 *
26 * You may elect to license modified versions of this file under the
27 * terms and conditions of either the GPL or the CDDL or both.
28 */
29
30
31/*******************************************************************************
32* Header Files *
33*******************************************************************************/
34#include <iprt/cpp/ministring.h>
35
36
37/*******************************************************************************
38* Global Variables *
39*******************************************************************************/
40const size_t RTCString::npos = ~(size_t)0;
41
42
43/*******************************************************************************
44* Defined Constants And Macros *
45*******************************************************************************/
46/** Allocation block alignment used when appending bytes to a string. */
47#define IPRT_MINISTRING_APPEND_ALIGNMENT 64
48
49
50RTCString &RTCString::printf(const char *pszFormat, ...)
51{
52 va_list va;
53 va_start(va, pszFormat);
54 printfV(pszFormat, va);
55 va_end(va);
56 return *this;
57}
58
59/**
60 * Callback used with RTStrFormatV by RTCString::printfV.
61 *
62 * @returns The number of bytes added (not used).
63 *
64 * @param pvArg The string object.
65 * @param pachChars The characters to append.
66 * @param cbChars The number of characters. 0 on the final callback.
67 */
68/*static*/ DECLCALLBACK(size_t)
69RTCString::printfOutputCallback(void *pvArg, const char *pachChars, size_t cbChars)
70{
71 RTCString *pThis = (RTCString *)pvArg;
72 if (cbChars)
73 {
74 size_t cchBoth = pThis->m_cch + cbChars;
75 if (cchBoth >= pThis->m_cbAllocated)
76 {
77 /* Double the buffer size, if it's less that _4M. Align sizes like
78 for append. */
79 size_t cbAlloc = RT_ALIGN_Z(pThis->m_cbAllocated, IPRT_MINISTRING_APPEND_ALIGNMENT);
80 cbAlloc += RT_MIN(cbAlloc, _4M);
81 if (cbAlloc <= cchBoth)
82 cbAlloc = RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT);
83 pThis->reserve(cbAlloc);
84#ifndef RT_EXCEPTIONS_ENABLED
85 AssertReleaseReturn(pThis->capacity() > cchBoth, 0);
86#endif
87 }
88
89 memcpy(&pThis->m_psz[pThis->m_cch], pachChars, cbChars);
90 pThis->m_cch = cchBoth;
91 pThis->m_psz[cchBoth] = '\0';
92 }
93 return cbChars;
94}
95
96RTCString &RTCString::printfV(const char *pszFormat, va_list va)
97{
98 cleanup();
99 RTStrFormatV(printfOutputCallback, this, NULL, NULL, pszFormat, va);
100 return *this;
101}
102
103RTCString &RTCString::append(const RTCString &that)
104{
105 size_t cchThat = that.length();
106 if (cchThat)
107 {
108 size_t cchThis = length();
109 size_t cchBoth = cchThis + cchThat;
110
111 if (cchBoth >= m_cbAllocated)
112 {
113 reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
114 // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
115#ifndef RT_EXCEPTIONS_ENABLED
116 AssertRelease(capacity() > cchBoth);
117#endif
118 }
119
120 memcpy(m_psz + cchThis, that.m_psz, cchThat);
121 m_psz[cchBoth] = '\0';
122 m_cch = cchBoth;
123 }
124 return *this;
125}
126
127RTCString &RTCString::append(const char *pszThat)
128{
129 size_t cchThat = strlen(pszThat);
130 if (cchThat)
131 {
132 size_t cchThis = length();
133 size_t cchBoth = cchThis + cchThat;
134
135 if (cchBoth >= m_cbAllocated)
136 {
137 reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
138 // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
139#ifndef RT_EXCEPTIONS_ENABLED
140 AssertRelease(capacity() > cchBoth);
141#endif
142 }
143
144 memcpy(&m_psz[cchThis], pszThat, cchThat);
145 m_psz[cchBoth] = '\0';
146 m_cch = cchBoth;
147 }
148 return *this;
149}
150
151RTCString& RTCString::append(char ch)
152{
153 Assert((unsigned char)ch < 0x80); /* Don't create invalid UTF-8. */
154 if (ch)
155 {
156 // allocate in chunks of 20 in case this gets called several times
157 if (m_cch + 1 >= m_cbAllocated)
158 {
159 reserve(RT_ALIGN_Z(m_cch + 2, IPRT_MINISTRING_APPEND_ALIGNMENT));
160 // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
161#ifndef RT_EXCEPTIONS_ENABLED
162 AssertRelease(capacity() > m_cch + 1);
163#endif
164 }
165
166 m_psz[m_cch] = ch;
167 m_psz[++m_cch] = '\0';
168 }
169 return *this;
170}
171
172RTCString &RTCString::appendCodePoint(RTUNICP uc)
173{
174 /*
175 * Single byte encoding.
176 */
177 if (uc < 0x80)
178 return RTCString::append((char)uc);
179
180 /*
181 * Multibyte encoding.
182 * Assume max encoding length when resizing the string, that's simpler.
183 */
184 AssertReturn(uc <= UINT32_C(0x7fffffff), *this);
185
186 if (m_cch + 6 >= m_cbAllocated)
187 {
188 reserve(RT_ALIGN_Z(m_cch + 6 + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
189 // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
190#ifndef RT_EXCEPTIONS_ENABLED
191 AssertRelease(capacity() > m_cch + 6);
192#endif
193 }
194
195 char *pszNext = RTStrPutCp(&m_psz[m_cch], uc);
196 m_cch = pszNext - m_psz;
197 *pszNext = '\0';
198
199 return *this;
200}
201
202size_t RTCString::find(const char *pcszFind, size_t pos /*= 0*/) const
203{
204 const char *pszThis, *p;
205
206 if ( ((pszThis = c_str()))
207 && (pos < length())
208 && ((p = strstr(pszThis + pos, pcszFind)))
209 )
210 return p - pszThis;
211
212 return npos;
213}
214
215void RTCString::findReplace(char cFind, char cReplace)
216{
217 for (size_t i = 0; i < length(); ++i)
218 {
219 char *p = &m_psz[i];
220 if (*p == cFind)
221 *p = cReplace;
222 }
223}
224
225RTCString RTCString::substrCP(size_t pos /*= 0*/, size_t n /*= npos*/) const
226{
227 RTCString ret;
228
229 if (n)
230 {
231 const char *psz;
232
233 if ((psz = c_str()))
234 {
235 RTUNICP cp;
236
237 // walk the UTF-8 characters until where the caller wants to start
238 size_t i = pos;
239 while (*psz && i--)
240 if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
241 return ret; // return empty string on bad encoding
242
243 const char *pFirst = psz;
244
245 if (n == npos)
246 // all the rest:
247 ret = pFirst;
248 else
249 {
250 i = n;
251 while (*psz && i--)
252 if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
253 return ret; // return empty string on bad encoding
254
255 size_t cbCopy = psz - pFirst;
256 if (cbCopy)
257 {
258 ret.reserve(cbCopy + 1); // may throw bad_alloc
259#ifndef RT_EXCEPTIONS_ENABLED
260 AssertRelease(capacity() >= cbCopy + 1);
261#endif
262 memcpy(ret.m_psz, pFirst, cbCopy);
263 ret.m_cch = cbCopy;
264 ret.m_psz[cbCopy] = '\0';
265 }
266 }
267 }
268 }
269
270 return ret;
271}
272
273bool RTCString::endsWith(const RTCString &that, CaseSensitivity cs /*= CaseSensitive*/) const
274{
275 size_t l1 = length();
276 if (l1 == 0)
277 return false;
278
279 size_t l2 = that.length();
280 if (l1 < l2)
281 return false;
282 /** @todo r=bird: If l2 is 0, then m_psz can be NULL and we will crash. See
283 * also handling of l2 == in startsWith. */
284
285 size_t l = l1 - l2;
286 if (cs == CaseSensitive)
287 return ::RTStrCmp(&m_psz[l], that.m_psz) == 0;
288 return ::RTStrICmp(&m_psz[l], that.m_psz) == 0;
289}
290
291bool RTCString::startsWith(const RTCString &that, CaseSensitivity cs /*= CaseSensitive*/) const
292{
293 size_t l1 = length();
294 size_t l2 = that.length();
295 if (l1 == 0 || l2 == 0) /** @todo r=bird: this differs from endsWith, and I think other IPRT code. If l2 == 0, it matches anything. */
296 return false;
297
298 if (l1 < l2)
299 return false;
300
301 if (cs == CaseSensitive)
302 return ::RTStrNCmp(m_psz, that.m_psz, l2) == 0;
303 return ::RTStrNICmp(m_psz, that.m_psz, l2) == 0;
304}
305
306bool RTCString::contains(const RTCString &that, CaseSensitivity cs /*= CaseSensitive*/) const
307{
308 /** @todo r-bird: Not checking for NULL strings like startsWith does (and
309 * endsWith only does half way). */
310 if (cs == CaseSensitive)
311 return ::RTStrStr(m_psz, that.m_psz) != NULL;
312 return ::RTStrIStr(m_psz, that.m_psz) != NULL;
313}
314
315int RTCString::toInt(uint64_t &i) const
316{
317 if (!m_psz)
318 return VERR_NO_DIGITS;
319 return RTStrToUInt64Ex(m_psz, NULL, 0, &i);
320}
321
322int RTCString::toInt(uint32_t &i) const
323{
324 if (!m_psz)
325 return VERR_NO_DIGITS;
326 return RTStrToUInt32Ex(m_psz, NULL, 0, &i);
327}
328
329RTCList<RTCString, RTCString *>
330RTCString::split(const RTCString &a_rstrSep, SplitMode mode /* = RemoveEmptyParts */)
331{
332 RTCList<RTCString> strRet;
333 if (!m_psz)
334 return strRet;
335 if (a_rstrSep.isEmpty())
336 {
337 strRet.append(RTCString(m_psz));
338 return strRet;
339 }
340
341 size_t cch = m_cch;
342 char const *pszTmp = m_psz;
343 while (cch > 0)
344 {
345 char const *pszNext = strstr(pszTmp, a_rstrSep.c_str());
346 if (!pszNext)
347 {
348 strRet.append(RTCString(pszTmp, cch));
349 break;
350 }
351 size_t cchNext = pszNext - pszTmp;
352 if ( cchNext > 0
353 || mode == KeepEmptyParts)
354 strRet.append(RTCString(pszTmp, cchNext));
355 pszTmp += cchNext + a_rstrSep.length();
356 cch -= cchNext + a_rstrSep.length();
357 }
358
359 return strRet;
360}
361
362/* static */
363RTCString
364RTCString::join(const RTCList<RTCString, RTCString *> &a_rList,
365 const RTCString &a_rstrSep /* = "" */)
366{
367 RTCString strRet;
368 if (a_rList.size() > 1)
369 {
370 /* calc the required size */
371 size_t cbNeeded = a_rstrSep.length() * (a_rList.size() - 1) + 1;
372 for (size_t i = 0; i < a_rList.size(); ++i)
373 cbNeeded += a_rList.at(i).length();
374 strRet.reserve(cbNeeded);
375
376 /* do the appending. */
377 for (size_t i = 0; i < a_rList.size() - 1; ++i)
378 {
379 strRet.append(a_rList.at(i));
380 strRet.append(a_rstrSep);
381 }
382 strRet.append(a_rList.last());
383 }
384 /* special case: one list item. */
385 else if (a_rList.size() > 0)
386 strRet.append(a_rList.last());
387
388 return strRet;
389}
390
391const RTCString operator+(const RTCString &a_rStr1, const RTCString &a_rStr2)
392{
393 RTCString strRet(a_rStr1);
394 strRet += a_rStr2;
395 return strRet;
396}
397
398const RTCString operator+(const RTCString &a_rStr1, const char *a_pszStr2)
399{
400 RTCString strRet(a_rStr1);
401 strRet += a_pszStr2;
402 return strRet;
403}
404
405const RTCString operator+(const char *a_psz1, const RTCString &a_rStr2)
406{
407 RTCString strRet(a_psz1);
408 strRet += a_rStr2;
409 return strRet;
410}
411
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette