VirtualBox

source: vbox/trunk/src/VBox/Runtime/common/string/ministring.cpp@ 35567

Last change on this file since 35567 was 35567, checked in by vboxsync, 14 years ago

IPRT: fix rare crash in MiniString::substr(); rename substr() to substrCP() and add a substr that operates on bytes, not codepoints; more to come

  • Property svn:eol-style set to native
  • Property svn:keywords set to Author Date Id Revision
File size: 9.7 KB
Line 
1/* $Id: ministring.cpp 35567 2011-01-14 14:16:45Z vboxsync $ */
2/** @file
3 * IPRT - Mini C++ string class.
4 *
5 * This is a base for both Utf8Str and other places where IPRT may want to use
6 * a lean C++ string class.
7 */
8
9/*
10 * Copyright (C) 2007-2010 Oracle Corporation
11 *
12 * This file is part of VirtualBox Open Source Edition (OSE), as
13 * available from http://www.virtualbox.org. This file is free software;
14 * you can redistribute it and/or modify it under the terms of the GNU
15 * General Public License (GPL) as published by the Free Software
16 * Foundation, in version 2 as it comes in the "COPYING" file of the
17 * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
18 * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
19 *
20 * The contents of this file may alternatively be used under the terms
21 * of the Common Development and Distribution License Version 1.0
22 * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
23 * VirtualBox OSE distribution, in which case the provisions of the
24 * CDDL are applicable instead of those of the GPL.
25 *
26 * You may elect to license modified versions of this file under the
27 * terms and conditions of either the GPL or the CDDL or both.
28 */
29
30
31/*******************************************************************************
32* Header Files *
33*******************************************************************************/
34#include <iprt/cpp/ministring.h>
35using namespace iprt;
36
37
38/*******************************************************************************
39* Global Variables *
40*******************************************************************************/
41const size_t MiniString::npos = ~(size_t)0;
42
43/*******************************************************************************
44* Defined Constants And Macros *
45*******************************************************************************/
46/** Allocation block alignment used when appending bytes to a string. */
47#define IPRT_MINISTRING_APPEND_ALIGNMENT 64
48
49
50MiniString &MiniString::printf(const char *pszFormat, ...)
51{
52 va_list va;
53 va_start(va, pszFormat);
54 printfV(pszFormat, va);
55 va_end(va);
56 return *this;
57}
58
59/**
60 * Callback used with RTStrFormatV by MiniString::printfV.
61 *
62 * @returns The number of bytes added (not used).
63 *
64 * @param pvArg The string object.
65 * @param pachChars The characters to append.
66 * @param cbChars The number of characters. 0 on the final callback.
67 */
68/*static*/ DECLCALLBACK(size_t)
69MiniString::printfOutputCallback(void *pvArg, const char *pachChars, size_t cbChars)
70{
71 MiniString *pThis = (MiniString *)pvArg;
72 if (cbChars)
73 {
74 size_t cchBoth = pThis->m_cch + cbChars;
75 if (cchBoth >= pThis->m_cbAllocated)
76 {
77 /* Double the buffer size, if it's less that _4M. Align sizes like
78 for append. */
79 size_t cbAlloc = RT_ALIGN_Z(pThis->m_cbAllocated, IPRT_MINISTRING_APPEND_ALIGNMENT);
80 cbAlloc += RT_MIN(cbAlloc, _4M);
81 if (cbAlloc <= cchBoth)
82 cbAlloc = RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT);
83 pThis->reserve(cbAlloc);
84#ifndef RT_EXCEPTIONS_ENABLED
85 AssertReleaseReturn(pThis->capacity() > cchBoth, 0);
86#endif
87 }
88
89 memcpy(&pThis->m_psz[pThis->m_cch], pachChars, cbChars);
90 pThis->m_cch = cchBoth;
91 pThis->m_psz[cchBoth] = '\0';
92 }
93 return cbChars;
94}
95
96MiniString &MiniString::printfV(const char *pszFormat, va_list va)
97{
98 cleanup();
99 RTStrFormatV(printfOutputCallback, this, NULL, NULL, pszFormat, va);
100 return *this;
101}
102
103MiniString &MiniString::append(const MiniString &that)
104{
105 size_t cchThat = that.length();
106 if (cchThat)
107 {
108 size_t cchThis = length();
109 size_t cchBoth = cchThis + cchThat;
110
111 if (cchBoth >= m_cbAllocated)
112 {
113 reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
114 // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
115#ifndef RT_EXCEPTIONS_ENABLED
116 AssertRelease(capacity() > cchBoth);
117#endif
118 }
119
120 memcpy(m_psz + cchThis, that.m_psz, cchThat);
121 m_psz[cchBoth] = '\0';
122 m_cch = cchBoth;
123 }
124 return *this;
125}
126
127MiniString &MiniString::append(const char *pszThat)
128{
129 size_t cchThat = strlen(pszThat);
130 if (cchThat)
131 {
132 size_t cchThis = length();
133 size_t cchBoth = cchThis + cchThat;
134
135 if (cchBoth >= m_cbAllocated)
136 {
137 reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
138 // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
139#ifndef RT_EXCEPTIONS_ENABLED
140 AssertRelease(capacity() > cchBoth);
141#endif
142 }
143
144 memcpy(&m_psz[cchThis], pszThat, cchThat);
145 m_psz[cchBoth] = '\0';
146 m_cch = cchBoth;
147 }
148 return *this;
149}
150
151MiniString& MiniString::append(char ch)
152{
153 Assert((unsigned char)ch < 0x80); /* Don't create invalid UTF-8. */
154 if (ch)
155 {
156 // allocate in chunks of 20 in case this gets called several times
157 if (m_cch + 1 >= m_cbAllocated)
158 {
159 reserve(RT_ALIGN_Z(m_cch + 2, IPRT_MINISTRING_APPEND_ALIGNMENT));
160 // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
161#ifndef RT_EXCEPTIONS_ENABLED
162 AssertRelease(capacity() > m_cch + 1);
163#endif
164 }
165
166 m_psz[m_cch] = ch;
167 m_psz[++m_cch] = '\0';
168 }
169 return *this;
170}
171
172MiniString &MiniString::appendCodePoint(RTUNICP uc)
173{
174 /*
175 * Single byte encoding.
176 */
177 if (uc < 0x80)
178 return MiniString::append((char)uc);
179
180 /*
181 * Multibyte encoding.
182 * Assume max encoding length when resizing the string, that's simpler.
183 */
184 AssertReturn(uc <= UINT32_C(0x7fffffff), *this);
185
186 if (m_cch + 6 >= m_cbAllocated)
187 {
188 reserve(RT_ALIGN_Z(m_cch + 6 + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
189 // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
190#ifndef RT_EXCEPTIONS_ENABLED
191 AssertRelease(capacity() > m_cch + 6);
192#endif
193 }
194
195 char *pszNext = RTStrPutCp(&m_psz[m_cch], uc);
196 m_cch = pszNext - m_psz;
197 *pszNext = '\0';
198
199 return *this;
200}
201
202size_t MiniString::find(const char *pcszFind, size_t pos /*= 0*/)
203 const
204{
205 const char *pszThis, *p;
206
207 if ( ((pszThis = c_str()))
208 && (pos < length())
209 && ((p = strstr(pszThis + pos, pcszFind)))
210 )
211 return p - pszThis;
212
213 return npos;
214}
215
216void MiniString::findReplace(char cFind, char cReplace)
217{
218 for (size_t i = 0; i < length(); ++i)
219 {
220 char *p = &m_psz[i];
221 if (*p == cFind)
222 *p = cReplace;
223 }
224}
225
226MiniString MiniString::substrCP(size_t pos /*= 0*/, size_t n /*= npos*/)
227 const
228{
229 MiniString ret;
230
231 if (n)
232 {
233 const char *psz;
234
235 if ((psz = c_str()))
236 {
237 RTUNICP cp;
238
239 // walk the UTF-8 characters until where the caller wants to start
240 size_t i = pos;
241 while (*psz && i--)
242 if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
243 return ret; // return empty string on bad encoding
244
245 const char *pFirst = psz;
246
247 if (n == npos)
248 // all the rest:
249 ret = pFirst;
250 else
251 {
252 i = n;
253 while (*psz && i--)
254 if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
255 return ret; // return empty string on bad encoding
256
257 size_t cbCopy = psz - pFirst;
258 if (cbCopy)
259 {
260 ret.reserve(cbCopy + 1); // may throw bad_alloc
261#ifndef RT_EXCEPTIONS_ENABLED
262 AssertRelease(capacity() >= cbCopy + 1);
263#endif
264 memcpy(ret.m_psz, pFirst, cbCopy);
265 ret.m_cch = cbCopy;
266 ret.m_psz[cbCopy] = '\0';
267 }
268 }
269 }
270 }
271
272 return ret;
273}
274
275bool MiniString::endsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
276{
277 size_t l1 = length();
278 if (l1 == 0)
279 return false;
280
281 size_t l2 = that.length();
282 if (l1 < l2)
283 return false;
284 /** @todo r=bird: If l2 is 0, then m_psz can be NULL and we will crash. See
285 * also handling of l2 == in startsWith. */
286
287 size_t l = l1 - l2;
288 if (cs == CaseSensitive)
289 return ::RTStrCmp(&m_psz[l], that.m_psz) == 0;
290 else
291 return ::RTStrICmp(&m_psz[l], that.m_psz) == 0;
292}
293
294bool MiniString::startsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
295{
296 size_t l1 = length();
297 size_t l2 = that.length();
298 if (l1 == 0 || l2 == 0) /** @todo r=bird: this differs from endsWith, and I think other IPRT code. If l2 == 0, it matches anything. */
299 return false;
300
301 if (l1 < l2)
302 return false;
303
304 if (cs == CaseSensitive)
305 return ::RTStrNCmp(m_psz, that.m_psz, l2) == 0;
306 else
307 return ::RTStrNICmp(m_psz, that.m_psz, l2) == 0;
308}
309
310bool MiniString::contains(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
311{
312 /** @todo r-bird: Not checking for NULL strings like startsWith does (and
313 * endsWith only does half way). */
314 if (cs == CaseSensitive)
315 return ::RTStrStr(m_psz, that.m_psz) != NULL;
316 else
317 return ::RTStrIStr(m_psz, that.m_psz) != NULL;
318}
319
320int MiniString::toInt(uint64_t &i) const
321{
322 if (!m_psz)
323 return VERR_NO_DIGITS;
324 return RTStrToUInt64Ex(m_psz, NULL, 0, &i);
325}
326
327int MiniString::toInt(uint32_t &i) const
328{
329 if (!m_psz)
330 return VERR_NO_DIGITS;
331 return RTStrToUInt32Ex(m_psz, NULL, 0, &i);
332}
333
Note: See TracBrowser for help on using the repository browser.

© 2024 Oracle Support Privacy / Do Not Sell My Info Terms of Use Trademark Policy Automated Access Etiquette