ministring.cpp revision 7f0bf7fc186a9b0de66702f6d1e44fcad695b73d
/* $Id$ */
/** @file
* IPRT - Mini C++ string class.
*
* This is a base for both Utf8Str and other places where IPRT may want to use
* a lean C++ string class.
*/
/*
* Copyright (C) 2007-2010 Oracle Corporation
*
* This file is part of VirtualBox Open Source Edition (OSE), as
* available from http://www.virtualbox.org. This file is free software;
* you can redistribute it and/or modify it under the terms of the GNU
* General Public License (GPL) as published by the Free Software
* Foundation, in version 2 as it comes in the "COPYING" file of the
* VirtualBox OSE distribution. VirtualBox OSE is distributed in the
* hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
*
* The contents of this file may alternatively be used under the terms
* of the Common Development and Distribution License Version 1.0
* (CDDL) only, as it comes in the "COPYING.CDDL" file of the
* VirtualBox OSE distribution, in which case the provisions of the
* CDDL are applicable instead of those of the GPL.
*
* You may elect to license modified versions of this file under the
* terms and conditions of either the GPL or the CDDL or both.
*/
/*******************************************************************************
* Header Files *
*******************************************************************************/
#include <iprt/cpp/ministring.h>
using namespace iprt;
/*******************************************************************************
* Global Variables *
*******************************************************************************/
const size_t MiniString::npos = ~(size_t)0;
/*******************************************************************************
* Defined Constants And Macros *
*******************************************************************************/
/** Allocation block alignment used when appending bytes to a string. */
#define IPRT_MINISTRING_APPEND_ALIGNMENT 64
MiniString &MiniString::printf(const char *pszFormat, ...)
{
va_list va;
va_start(va, pszFormat);
printfV(pszFormat, va);
va_end(va);
return *this;
}
/**
* Callback used with RTStrFormatV by MiniString::printfV.
*
* @returns The number of bytes added (not used).
*
* @param pvArg The string object.
* @param pachChars The characters to append.
* @param cbChars The number of characters. 0 on the final callback.
*/
/*static*/ DECLCALLBACK(size_t)
MiniString::printfOutputCallback(void *pvArg, const char *pachChars, size_t cbChars)
{
MiniString *pThis = (MiniString *)pvArg;
if (cbChars)
{
size_t cchBoth = pThis->m_cch + cbChars;
if (cchBoth >= pThis->m_cbAllocated)
{
/* Double the buffer size, if it's less that _4M. Align sizes like
for append. */
size_t cbAlloc = RT_ALIGN_Z(pThis->m_cbAllocated, IPRT_MINISTRING_APPEND_ALIGNMENT);
cbAlloc += RT_MIN(cbAlloc, _4M);
if (cbAlloc <= cchBoth)
cbAlloc = RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT);
pThis->reserve(cbAlloc);
#ifndef RT_EXCEPTIONS_ENABLED
AssertReleaseReturn(pThis->capacity() > cchBoth, 0);
#endif
}
memcpy(&pThis->m_psz[pThis->m_cch], pachChars, cbChars);
pThis->m_cch = cchBoth;
pThis->m_psz[cchBoth] = '\0';
}
return cbChars;
}
MiniString &MiniString::printfV(const char *pszFormat, va_list va)
{
cleanup();
RTStrFormatV(printfOutputCallback, this, NULL, NULL, pszFormat, va);
return *this;
}
MiniString &MiniString::append(const MiniString &that)
{
size_t cchThat = that.length();
if (cchThat)
{
size_t cchThis = length();
size_t cchBoth = cchThis + cchThat;
if (cchBoth >= m_cbAllocated)
{
reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
// calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
#ifndef RT_EXCEPTIONS_ENABLED
AssertRelease(capacity() > cchBoth);
#endif
}
memcpy(m_psz + cchThis, that.m_psz, cchThat);
m_psz[cchBoth] = '\0';
m_cch = cchBoth;
}
return *this;
}
MiniString &MiniString::append(const char *pszThat)
{
size_t cchThat = strlen(pszThat);
if (cchThat)
{
size_t cchThis = length();
size_t cchBoth = cchThis + cchThat;
if (cchBoth >= m_cbAllocated)
{
reserve(RT_ALIGN_Z(cchBoth + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
// calls realloc(cchBoth + 1) and sets m_cbAllocated; may throw bad_alloc.
#ifndef RT_EXCEPTIONS_ENABLED
AssertRelease(capacity() > cchBoth);
#endif
}
memcpy(&m_psz[cchThis], pszThat, cchThat);
m_psz[cchBoth] = '\0';
m_cch = cchBoth;
}
return *this;
}
MiniString& MiniString::append(char ch)
{
Assert((unsigned char)ch < 0x80); /* Don't create invalid UTF-8. */
if (ch)
{
// allocate in chunks of 20 in case this gets called several times
if (m_cch + 1 >= m_cbAllocated)
{
reserve(RT_ALIGN_Z(m_cch + 2, IPRT_MINISTRING_APPEND_ALIGNMENT));
// calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
#ifndef RT_EXCEPTIONS_ENABLED
AssertRelease(capacity() > m_cch + 1);
#endif
}
m_psz[m_cch] = ch;
m_psz[++m_cch] = '\0';
}
return *this;
}
MiniString &MiniString::appendCodePoint(RTUNICP uc)
{
/*
* Single byte encoding.
*/
if (uc < 0x80)
return MiniString::append((char)uc);
/*
* Multibyte encoding.
* Assume max encoding length when resizing the string, that's simpler.
*/
AssertReturn(uc <= UINT32_C(0x7fffffff), *this);
if (m_cch + 6 >= m_cbAllocated)
{
reserve(RT_ALIGN_Z(m_cch + 6 + 1, IPRT_MINISTRING_APPEND_ALIGNMENT));
// calls realloc(cbBoth) and sets m_cbAllocated; may throw bad_alloc.
#ifndef RT_EXCEPTIONS_ENABLED
AssertRelease(capacity() > m_cch + 6);
#endif
}
char *pszNext = RTStrPutCp(&m_psz[m_cch], uc);
m_cch = pszNext - m_psz;
*pszNext = '\0';
return *this;
}
size_t MiniString::find(const char *pcszFind, size_t pos /*= 0*/)
const
{
const char *pszThis, *p;
if ( ((pszThis = c_str()))
&& (pos < length())
&& ((p = strstr(pszThis + pos, pcszFind)))
)
return p - pszThis;
return npos;
}
void MiniString::findReplace(char cFind, char cReplace)
{
for (size_t i = 0; i < length(); ++i)
{
char *p = &m_psz[i];
if (*p == cFind)
*p = cReplace;
}
}
MiniString MiniString::substrCP(size_t pos /*= 0*/, size_t n /*= npos*/)
const
{
MiniString ret;
if (n)
{
const char *psz;
if ((psz = c_str()))
{
RTUNICP cp;
// walk the UTF-8 characters until where the caller wants to start
size_t i = pos;
while (*psz && i--)
if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
return ret; // return empty string on bad encoding
const char *pFirst = psz;
if (n == npos)
// all the rest:
ret = pFirst;
else
{
i = n;
while (*psz && i--)
if (RT_FAILURE(RTStrGetCpEx(&psz, &cp)))
return ret; // return empty string on bad encoding
size_t cbCopy = psz - pFirst;
if (cbCopy)
{
ret.reserve(cbCopy + 1); // may throw bad_alloc
#ifndef RT_EXCEPTIONS_ENABLED
AssertRelease(capacity() >= cbCopy + 1);
#endif
memcpy(ret.m_psz, pFirst, cbCopy);
ret.m_cch = cbCopy;
ret.m_psz[cbCopy] = '\0';
}
}
}
}
return ret;
}
bool MiniString::endsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
{
size_t l1 = length();
if (l1 == 0)
return false;
size_t l2 = that.length();
if (l1 < l2)
return false;
/** @todo r=bird: If l2 is 0, then m_psz can be NULL and we will crash. See
* also handling of l2 == in startsWith. */
size_t l = l1 - l2;
if (cs == CaseSensitive)
return ::RTStrCmp(&m_psz[l], that.m_psz) == 0;
else
return ::RTStrICmp(&m_psz[l], that.m_psz) == 0;
}
bool MiniString::startsWith(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
{
size_t l1 = length();
size_t l2 = that.length();
if (l1 == 0 || l2 == 0) /** @todo r=bird: this differs from endsWith, and I think other IPRT code. If l2 == 0, it matches anything. */
return false;
if (l1 < l2)
return false;
if (cs == CaseSensitive)
return ::RTStrNCmp(m_psz, that.m_psz, l2) == 0;
else
return ::RTStrNICmp(m_psz, that.m_psz, l2) == 0;
}
bool MiniString::contains(const MiniString &that, CaseSensitivity cs /*= CaseSensitive*/) const
{
/** @todo r-bird: Not checking for NULL strings like startsWith does (and
* endsWith only does half way). */
if (cs == CaseSensitive)
return ::RTStrStr(m_psz, that.m_psz) != NULL;
else
return ::RTStrIStr(m_psz, that.m_psz) != NULL;
}
int MiniString::toInt(uint64_t &i) const
{
if (!m_psz)
return VERR_NO_DIGITS;
return RTStrToUInt64Ex(m_psz, NULL, 0, &i);
}
int MiniString::toInt(uint32_t &i) const
{
if (!m_psz)
return VERR_NO_DIGITS;
return RTStrToUInt32Ex(m_psz, NULL, 0, &i);
}
iprt::list<iprt::MiniString, iprt::MiniString*> MiniString::split(const iprt::MiniString &strSep, SplitMode mode /* = RemoveEmptyParts */)
{
iprt::list<iprt::MiniString> res;
if (!m_psz)
return res;
if (strSep.isEmpty())
{
res.append(iprt::MiniString(m_psz));
return res;
}
size_t cch = m_cch;
char *pszTmp = m_psz;
while(cch > 0)
{
char *pszNext = strstr(pszTmp, strSep.c_str());
if (!pszNext)
break;
size_t chNext = pszNext - pszTmp;
if ( chNext > 0
|| mode == KeepEmptyParts)
res.append(iprt::MiniString(pszTmp, chNext));
pszTmp += chNext + strSep.length();
cch -= chNext + strSep.length();
}
/* Some characters left at the end? */
if (cch > 0)
res.append(iprt::MiniString(pszTmp, cch));
return res;
}
/* static */
iprt::MiniString MiniString::join(const iprt::list<iprt::MiniString, iprt::MiniString*> &list, const iprt::MiniString &strSep /* = "" */)
{
MiniString res;
if (list.size() > 1)
{
for(size_t i = 0; i < list.size() - 1; ++i)
res += list.at(i) + strSep;
res += list.last();
}
return res;
}
const iprt::MiniString operator+(const iprt::MiniString &one, const iprt::MiniString &other)
{
iprt::MiniString res(one);
return res += other;
}
const iprt::MiniString operator+(const iprt::MiniString &one, const char *pcszOther)
{
iprt::MiniString res(one);
return res += pcszOther;
}
const iprt::MiniString operator+(const char *pcszOne, const iprt::MiniString &other)
{
iprt::MiniString res(pcszOne);
return res += other;
}