1 | /* $Id: ministring.cpp 35567 2011-01-14 14:16:45Z vboxsync $ */
|
---|
2 | /** @file
|
---|
3 | * IPRT - Mini C++ string class.
|
---|
4 | *
|
---|
5 | * This is a base for both Utf8Str and other places where IPRT may want to use
|
---|
6 | * a lean C++ string class.
|
---|
7 | */
|
---|
8 |
|
---|
9 | /*
|
---|
10 | * Copyright (C) 2007-2010 Oracle Corporation
|
---|
11 | *
|
---|
12 | * This file is part of VirtualBox Open Source Edition (OSE), as
|
---|
13 | * available from http://www.virtualbox.org. This file is free software;
|
---|
14 | * you can redistribute it and/or modify it under the terms of the GNU
|
---|
15 | * General Public License (GPL) as published by the Free Software
|
---|
16 | * Foundation, in version 2 as it comes in the "COPYING" file of the
|
---|
17 | * VirtualBox OSE distribution. VirtualBox OSE is distributed in the
|
---|
18 | * hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
|
---|
19 | *
|
---|
20 | * The contents of this file may alternatively be used under the terms
|
---|
21 | * of the Common Development and Distribution License Version 1.0
|
---|
22 | * (CDDL) only, as it comes in the "COPYING.CDDL" file of the
|
---|
23 | * VirtualBox OSE distribution, in which case the provisions of the
|
---|
24 | * CDDL are applicable instead of those of the GPL.
|
---|
25 | *
|
---|
26 | * You may elect to license modified versions of this file under the
|
---|
27 | * terms and conditions of either the GPL or the CDDL or both.
|
---|
28 | */
|
---|
29 |
|
---|
30 |
|
---|
31 | /*******************************************************************************
|
---|
32 | * Header Files *
|
---|
33 | *******************************************************************************/
|
---|
34 | #include <iprt/cpp/ministring.h>
|
---|
35 | using namespace iprt;
|
---|
36 |
|
---|
37 |
|
---|
38 | /*******************************************************************************
|
---|
39 | * Global Variables *
|
---|
40 | *******************************************************************************/
|
---|
41 | const size_t MiniString::npos = ~(size_t)0;
|
---|
42 |
|
---|
43 | /*******************************************************************************
|
---|
44 | * Defined Constants And Macros *
|
---|
45 | *******************************************************************************/
|
---|
46 | /** Allocation block alignment used when appending bytes to a string. */
|
---|
47 | #define IPRT_MINISTRING_APPEND_ALIGNMENT 64
|
---|
48 |
|
---|
49 |
|
---|
50 | MiniString &MiniString::printf(const char *pszFormat, ...)
|
---|
51 | {
|
---|
52 | va_list va;
|
---|
53 | va_start(va, pszFormat);
|
---|
54 | printfV(pszFormat, va);
|
---|
55 | va_end(va);
|
---|
56 | return *this;
|
---|
57 | }
|
---|
58 |
|
---|
59 | /**
|
---|
60 | * Callback used with RTStrFormatV by MiniString::printfV.
|
---|
61 | *
|
---|
62 | * @returns The number of bytes added (not used).
|
---|
63 | *
|
---|
64 | * @param pvArg The string object.
|
---|
65 | * @param pachChars The characters to append.
|
---|
66 | * @param cbChars The number of characters. 0 on the final callback.
|
---|
67 | */
|
---|
68 | /*static*/ DECLCALLBACK(size_t)
|
---|
69 | MiniString::printfOutputCallback(void *pvArg, const char *pachChars, size_t cbChars)
|
---|
70 | {
|
---|
71 | MiniString *pThis = (MiniString *)pvArg;
|
---|
72 | if (cbChars)
|
---|
73 | {
|
---|
74 | size_t cchBoth = pThis->m_cch + cbChars;
|
---|
75 | if (cchBoth >= pThis->m_cbAllocated)
|
---|
76 | {
|
---|
77 | /* Double the buffer size, if it's less that _4M. Align sizes like
|
---|
78 | for append. */
|
---|
79 | size_t cbAlloc = RT_ALIGN_Z(pThis->m_cbAllocated, IPRT_MINISTRING_APPEND_ALIGNMENT);
|
---|
80 | cbAlloc += RT_MIN(cbAlloc, _4M);
|
---|
81 | if (cbAlloc <= cchBoth)
|
---|
82 | cbAlloc = RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT);
|
---|
83 | pThis->reserve(cbAlloc);
|
---|
84 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
85 | AssertReleaseReturn(pThis->capacity() > cchBoth, 0);
|
---|
86 | #endif
|
---|
87 | }
|
---|
88 |
|
---|
89 | memcpy(&pThis->m_psz[pThis->m_cch], pachChars, cbChars);
|
---|
90 | pThis->m_cch = cchBoth;
|
---|
91 | pThis->m_psz[cchBoth] = '\0';
|
---|
92 | }
|
---|
93 | return cbChars;
|
---|
94 | }
|
---|
95 |
|
---|
96 | MiniString &MiniString::printfV(const char *pszFormat, va_list va)
|
---|
97 | {
|
---|
98 | cleanup();
|
---|
99 | RTStrFormatV(printfOutputCallback, this, NULL, NULL, pszFormat, va);
|
---|
100 | return *this;
|
---|
101 | }
|
---|
102 |
|
---|
103 | MiniString &MiniString::append(const MiniString &that)
|
---|
104 | {
|
---|
105 | size_t cchThat = that.length();
|
---|
106 | if (cchThat)
|
---|
107 | {
|
---|
108 | size_t cchThis = length();
|
---|
109 | size_t cchBoth = cchThis + cchThat;
|
---|
110 |
|
---|
111 | if (cchBoth >= m_cbAllocated)
|
---|
112 | {
|
---|
113 | reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
|
---|
114 | // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
|
---|
115 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
116 | AssertRelease(capacity() > cchBoth);
|
---|
117 | #endif
|
---|
118 | }
|
---|
119 |
|
---|
120 | memcpy(m_psz + cchThis, that.m_psz, cchThat);
|
---|
121 | m_psz[cchBoth] = '\0';
|
---|
122 | m_cch = cchBoth;
|
---|
123 | }
|
---|
124 | return *this;
|
---|
125 | }
|
---|
126 |
|
---|
127 | MiniString &MiniString::append(const char *pszThat)
|
---|
128 | {
|
---|
129 | size_t cchThat = strlen(pszThat);
|
---|
130 | if (cchThat)
|
---|
131 | {
|
---|
132 | size_t cchThis = length();
|
---|
133 | size_t cchBoth = cchThis + cchThat;
|
---|
134 |
|
---|
135 | if (cchBoth >= m_cbAllocated)
|
---|
136 | {
|
---|
137 | reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
|
---|
138 | // calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
|
---|
139 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
140 | AssertRelease(capacity() > cchBoth);
|
---|
141 | #endif
|
---|
142 | }
|
---|
143 |
|
---|
144 | memcpy(&m_psz[cchThis], pszThat, cchThat);
|
---|
145 | m_psz[cchBoth] = '\0';
|
---|
146 | m_cch = cchBoth;
|
---|
147 | }
|
---|
148 | return *this;
|
---|
149 | }
|
---|
150 |
|
---|
151 | MiniString& MiniString::append(char ch)
|
---|
152 | {
|
---|
153 | Assert((unsigned char)ch < 0x80); /* Don't create invalid UTF-8. */
|
---|
154 | if (ch)
|
---|
155 | {
|
---|
156 | // allocate in chunks of 20 in case this gets called several times
|
---|
157 | if (m_cch + 1 >= m_cbAllocated)
|
---|
158 | {
|
---|
159 | reserve(RT_ALIGN_Z(m_cch + 2, IPRT_MINISTRING_APPEND_ALIGNMENT));
|
---|
160 | // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
|
---|
161 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
162 | AssertRelease(capacity() > m_cch + 1);
|
---|
163 | #endif
|
---|
164 | }
|
---|
165 |
|
---|
166 | m_psz[m_cch] = ch;
|
---|
167 | m_psz[++m_cch] = '\0';
|
---|
168 | }
|
---|
169 | return *this;
|
---|
170 | }
|
---|
171 |
|
---|
172 | MiniString &MiniString::appendCodePoint(RTUNICP uc)
|
---|
173 | {
|
---|
174 | /*
|
---|
175 | * Single byte encoding.
|
---|
176 | */
|
---|
177 | if (uc < 0x80)
|
---|
178 | return MiniString::append((char)uc);
|
---|
179 |
|
---|
180 | /*
|
---|
181 | * Multibyte encoding.
|
---|
182 | * Assume max encoding length when resizing the string, that's simpler.
|
---|
183 | */
|
---|
184 | AssertReturn(uc <= UINT32_C(0x7fffffff), *this);
|
---|
185 |
|
---|
186 | if (m_cch + 6 >= m_cbAllocated)
|
---|
187 | {
|
---|
188 | reserve(RT_ALIGN_Z(m_cch + 6 + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
|
---|
189 | // calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
|
---|
190 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
191 | AssertRelease(capacity() > m_cch + 6);
|
---|
192 | #endif
|
---|
193 | }
|
---|
194 |
|
---|
195 | char *pszNext = RTStrPutCp(&m_psz[m_cch], uc);
|
---|
196 | m_cch = pszNext - m_psz;
|
---|
197 | *pszNext = '\0';
|
---|
198 |
|
---|
199 | return *this;
|
---|
200 | }
|
---|
201 |
|
---|
202 | size_t MiniString::find(const char *pcszFind, size_t pos /*= 0*/)
|
---|
203 | const
|
---|
204 | {
|
---|
205 | const char *pszThis, *p;
|
---|
206 |
|
---|
207 | if ( ((pszThis = c_str()))
|
---|
208 | && (pos < length())
|
---|
209 | && ((p = strstr(pszThis + pos, pcszFind)))
|
---|
210 | )
|
---|
211 | return p - pszThis;
|
---|
212 |
|
---|
213 | return npos;
|
---|
214 | }
|
---|
215 |
|
---|
216 | void MiniString::findReplace(char cFind, char cReplace)
|
---|
217 | {
|
---|
218 | for (size_t i = 0; i < length(); ++i)
|
---|
219 | {
|
---|
220 | char *p = &m_psz[i];
|
---|
221 | if (*p == cFind)
|
---|
222 | *p = cReplace;
|
---|
223 | }
|
---|
224 | }
|
---|
225 |
|
---|
226 | MiniString MiniString::substrCP(size_t pos /*= 0*/, size_t n /*= npos*/)
|
---|
227 | const
|
---|
228 | {
|
---|
229 | MiniString ret;
|
---|
230 |
|
---|
231 | if (n)
|
---|
232 | {
|
---|
233 | const char *psz;
|
---|
234 |
|
---|
235 | if ((psz = c_str()))
|
---|
236 | {
|
---|
237 | RTUNICP cp;
|
---|
238 |
|
---|
239 | // walk the UTF-8 characters until where the caller wants to start
|
---|
240 | size_t i = pos;
|
---|
241 | while (*psz && i--)
|
---|
242 | if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
|
---|
243 | return ret; // return empty string on bad encoding
|
---|
244 |
|
---|
245 | const char *pFirst = psz;
|
---|
246 |
|
---|
247 | if (n == npos)
|
---|
248 | // all the rest:
|
---|
249 | ret = pFirst;
|
---|
250 | else
|
---|
251 | {
|
---|
252 | i = n;
|
---|
253 | while (*psz && i--)
|
---|
254 | if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
|
---|
255 | return ret; // return empty string on bad encoding
|
---|
256 |
|
---|
257 | size_t cbCopy = psz - pFirst;
|
---|
258 | if (cbCopy)
|
---|
259 | {
|
---|
260 | ret.reserve(cbCopy + 1); // may throw bad_alloc
|
---|
261 | #ifndef RT_EXCEPTIONS_ENABLED
|
---|
262 | AssertRelease(capacity() >= cbCopy + 1);
|
---|
263 | #endif
|
---|
264 | memcpy(ret.m_psz, pFirst, cbCopy);
|
---|
265 | ret.m_cch = cbCopy;
|
---|
266 | ret.m_psz[cbCopy] = '\0';
|
---|
267 | }
|
---|
268 | }
|
---|
269 | }
|
---|
270 | }
|
---|
271 |
|
---|
272 | return ret;
|
---|
273 | }
|
---|
274 |
|
---|
275 | bool MiniString::endsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
|
---|
276 | {
|
---|
277 | size_t l1 = length();
|
---|
278 | if (l1 == 0)
|
---|
279 | return false;
|
---|
280 |
|
---|
281 | size_t l2 = that.length();
|
---|
282 | if (l1 < l2)
|
---|
283 | return false;
|
---|
284 | /** @todo r=bird: If l2 is 0, then m_psz can be NULL and we will crash. See
|
---|
285 | * also handling of l2 == in startsWith. */
|
---|
286 |
|
---|
287 | size_t l = l1 - l2;
|
---|
288 | if (cs == CaseSensitive)
|
---|
289 | return ::RTStrCmp(&m_psz[l], that.m_psz) == 0;
|
---|
290 | else
|
---|
291 | return ::RTStrICmp(&m_psz[l], that.m_psz) == 0;
|
---|
292 | }
|
---|
293 |
|
---|
294 | bool MiniString::startsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
|
---|
295 | {
|
---|
296 | size_t l1 = length();
|
---|
297 | size_t l2 = that.length();
|
---|
298 | if (l1 == 0 || l2 == 0) /** @todo r=bird: this differs from endsWith, and I think other IPRT code. If l2 == 0, it matches anything. */
|
---|
299 | return false;
|
---|
300 |
|
---|
301 | if (l1 < l2)
|
---|
302 | return false;
|
---|
303 |
|
---|
304 | if (cs == CaseSensitive)
|
---|
305 | return ::RTStrNCmp(m_psz, that.m_psz, l2) == 0;
|
---|
306 | else
|
---|
307 | return ::RTStrNICmp(m_psz, that.m_psz, l2) == 0;
|
---|
308 | }
|
---|
309 |
|
---|
310 | bool MiniString::contains(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
|
---|
311 | {
|
---|
312 | /** @todo r-bird: Not checking for NULL strings like startsWith does (and
|
---|
313 | * endsWith only does half way). */
|
---|
314 | if (cs == CaseSensitive)
|
---|
315 | return ::RTStrStr(m_psz, that.m_psz) != NULL;
|
---|
316 | else
|
---|
317 | return ::RTStrIStr(m_psz, that.m_psz) != NULL;
|
---|
318 | }
|
---|
319 |
|
---|
320 | int MiniString::toInt(uint64_t &i) const
|
---|
321 | {
|
---|
322 | if (!m_psz)
|
---|
323 | return VERR_NO_DIGITS;
|
---|
324 | return RTStrToUInt64Ex(m_psz, NULL, 0, &i);
|
---|
325 | }
|
---|
326 |
|
---|
327 | int MiniString::toInt(uint32_t &i) const
|
---|
328 | {
|
---|
329 | if (!m_psz)
|
---|
330 | return VERR_NO_DIGITS;
|
---|
331 | return RTStrToUInt32Ex(m_psz, NULL, 0, &i);
|
---|
332 | }
|
---|
333 |
|
---|