string.h revision e64031e20c39650a7bc902a3e1aba613b9415dee
/* $Id$ */
/** @file
* MS COM / XPCOM Abstraction Layer:
* Smart string classes declaration
*/
/*
* Copyright (C) 2006-2009 Oracle Corporation
*
* This file is part of VirtualBox Open Source Edition (OSE), as
* available from http://www.virtualbox.org. This file is free software;
* General Public License (GPL) as published by the Free Software
* Foundation, in version 2 as it comes in the "COPYING" file of the
* VirtualBox OSE distribution. VirtualBox OSE is distributed in the
* hope that it will be useful, but WITHOUT ANY WARRANTY of any kind.
*
* The contents of this file may alternatively be used under the terms
* of the Common Development and Distribution License Version 1.0
* (CDDL) only, as it comes in the "COPYING.CDDL" file of the
* VirtualBox OSE distribution, in which case the provisions of the
* CDDL are applicable instead of those of the GPL.
*
* You may elect to license modified versions of this file under the
* terms and conditions of either the GPL or the CDDL or both.
*/
#ifndef ___VBox_com_string_h
#define ___VBox_com_string_h
/* Make sure all the stdint.h macros are included - must come first! */
#ifndef __STDC_LIMIT_MACROS
# define __STDC_LIMIT_MACROS
#endif
#ifndef __STDC_CONSTANT_MACROS
# define __STDC_CONSTANT_MACROS
#endif
#if defined (VBOX_WITH_XPCOM)
# include <nsMemory.h>
#endif
{
// global constant in glue/string.cpp that represents an empty BSTR
extern const BSTR g_bstrEmpty;
/**
* String class used universally in Main for COM-style Utf-16 strings.
* Unfortunately COM on Windows uses UTF-16 everywhere, requiring conversions
* back and forth since most of VirtualBox and our libraries use UTF-8.
*
* To make things more obscure, on Windows, a COM-style BSTR is not just a
* pointer to a null-terminated wide character array, but the four bytes
* (32 bits) BEFORE the memory that the pointer points to are a length
* DWORD. One must therefore avoid pointer arithmetic and always use
* SysAllocString and the like to deal with BSTR pointers, which manage
* that DWORD correctly.
*
* For platforms other than Windows, we provide our own versions of the
* Sys* functions in Main/xpcom/helpers.cpp which do NOT use length
* prefixes though to be compatible with how XPCOM allocates string
* parameters to public functions.
*
* The Bstr class hides all this handling behind a std::string-like interface
* and also provides automatic conversions to MiniString and Utf8Str instances.
*
* The one advantage of using the SysString* routines is that this makes it
* and pass their values to callers through component methods' output parameters
* using the #cloneTo() operation. Also, the class can adopt (take ownership of)
* string buffers returned in output parameters of COM methods using the
* #asOutParam() operation and correctly free them afterwards.
*
* Starting with VirtualBox 3.2, like Utf8Str, Bstr no longer differentiates
* between NULL strings and empty strings. In other words, Bstr("") and
* Bstr(NULL) behave the same. In both cases, Bstr allocates no memory,
* reports a zero length and zero allocated bytes for both, and returns an
* empty C wide string from raw().
*/
{
Bstr()
{ }
{
}
{
}
#if defined (VBOX_WITH_XPCOM)
{
}
#endif
{
}
{
}
~Bstr()
{
setNull();
}
{
cleanup();
return *this;
}
{
cleanup();
return *this;
}
#if defined (VBOX_WITH_XPCOM)
{
cleanup();
return *this;
}
#endif
{
cleanup();
return *this;
}
/** Case sensitivity selector. */
enum CaseSensitivity
{
};
/**
* Compares the member string to str.
* @param str
* @param cs Whether comparison should be case-sensitive.
* @return
*/
{
if (cs == CaseSensitive)
}
{
}
/**
* Returns true if the member string has no length.
* This is true for instances created from both NULL and "" input strings.
*
* @note Always use this method to check if an instance is empty. Do not
* use length() because that may need to run through the entire string
* (Bstr does not cache string lengths). Also do not use operator bool();
* for one, MSVC is really annoying with its thinking that that is ambiguous,
* and even though operator bool() is protected with Bstr, at least gcc uses
* operator CBSTR() when a construct like "if (string)" is encountered, which
* is always true now since it raw() never returns an empty string. Again,
* always use isEmpty() even though if (string) may compile!
*/
/**
* Returns true if the member string is not empty. I'd like to make this
* private but since we require operator BSTR() it's futile anyway because
* the compiler will then (wrongly) use that one instead. Also if this is
* private the odd WORKAROUND_MSVC7_ERROR_C2593_FOR_BOOL_OP macro below
* will fail on Windows.
*/
operator bool() const
{
}
/**
* Returns a pointer to the raw member UTF-16 string. If the member string is empty,
* returns a pointer to a global variable containing an empty BSTR with a proper zero
* length prefix so that Windows is happy.
*/
{
if (m_bstr)
return m_bstr;
return g_bstrEmpty;
}
/**
* Convenience operator so that Bstr's can be passed to CBSTR input parameters
* of COM methods.
*/
/**
* Convenience operator so that Bstr's can be passed to CBSTR input parameters
* of COM methods. Unfortunately this is required for Windows since with
* MSCOM, input BSTR parameters of interface methods are not const.
*/
/**
* Returns a non-const raw pointer that allows to modify the string directly.
* As opposed to raw(), this DOES return NULL if the member string is empty
* because we cannot return a mutable pointer to the global variable with the
* empty string.
*
* @warning
* Be sure not to modify data beyond the allocated memory! The
* guaranteed size of the allocated memory is at least #length()
* bytes after creation and after every assignment operation.
*/
/**
* Intended to assign copies of instances to |BSTR| out parameters from
* within the interface method. Transfers the ownership of the duplicated
* string to the caller.
*
* If the member string is empty, this allocates an empty BSTR in *pstr
* (i.e. makes it point to a new buffer with a null byte).
*/
{
if (pstr)
{
#ifdef RT_EXCEPTIONS_ENABLED
if (!*pstr)
#endif
}
}
/**
* Intended to assign instances to |BSTR| out parameters from within the
* interface method. Transfers the ownership of the original string to the
* caller and resets the instance to null.
*
* As opposed to cloneTo(), this method doesn't create a copy of the
* string.
*
* If the member string is empty, this allocates an empty BSTR in *pstr
* (i.e. makes it point to a new buffer with a null byte).
*/
{
if (m_bstr)
else
{
// allocate null BSTR
#ifdef RT_EXCEPTIONS_ENABLED
if (!*pstr)
#endif
}
}
/**
* Intended to pass instances as |BSTR| out parameters to methods.
* Takes the ownership of the returned data.
*/
BSTR* asOutParam()
{
cleanup();
return &m_bstr;
}
/**
* Static immutable null object. May be used for comparison purposes.
*/
void cleanup()
{
if (m_bstr)
{
::SysFreeString(m_bstr);
}
}
/**
* Protected internal helper to copy a string. This ignores the previous object
* state, so either call this from a constructor or call cleanup() first.
*
* This variant copies from a zero-terminated UTF-16 string (which need not
* be a BSTR, i.e. need not have a length prefix).
*
* If the source is empty, this sets the member string to NULL.
* @param rs
*/
{
{
#ifdef RT_EXCEPTIONS_ENABLED
if (!m_bstr)
#endif
}
else
}
/**
* Protected internal helper to copy a string. This ignores the previous object
* state, so either call this from a constructor or call cleanup() first.
*
* This variant copies and converts from a zero-terminated UTF-8 string.
*
* If the source is empty, this sets the member string to NULL.
* @param rs
*/
{
{
::RTStrToUtf16(rs, &s);
#ifdef RT_EXCEPTIONS_ENABLED
if (!s)
#endif
::RTUtf16Free(s);
}
else
}
};
/* symmetric compare operators */
// work around error C2593 of the stupid MSVC 7.x ambiguity resolver
////////////////////////////////////////////////////////////////////////////////
/**
* String class used universally in Main for UTF-8 strings.
*
* This is based on iprt::MiniString, to which some functionality has been
* moved. Here we keep things that are specific to Main, such as conversions
* with UTF-16 strings (Bstr).
*
* Like iprt::MiniString, Utf8Str does not differentiate between NULL strings
* and empty strings. In other words, Utf8Str("") and Utf8Str(NULL)
* behave the same. In both cases, MiniString allocates no memory, reports
* a zero length and zero allocated bytes for both, and returns an empty
* C string from c_str().
*/
{
Utf8Str() {}
: MiniString(that)
{}
: MiniString(that)
{}
{
}
{
}
{
return *this;
}
{
return *this;
}
{
cleanup();
return *this;
}
{
cleanup();
return *this;
}
#if defined (VBOX_WITH_XPCOM)
/**
* Intended to assign instances to |char *| out parameters from within the
* interface method. Transfers the ownership of the duplicated string to the
* caller.
*
* This allocates a single 0 byte in the target if the member string is empty.
*
* This uses XPCOM memory allocation and thus only works on XPCOM. MSCOM doesn't
* like char* strings anyway.
*/
#endif
/**
* Intended to assign instances to |BSTR| out parameters from within the
* interface method. Transfers the ownership of the duplicated string to the
* caller.
*/
{
if (pstr)
{
}
}
/**
* Converts "this" to lower case by calling RTStrToLower().
* @return
*/
/**
* Converts "this" to upper case by calling RTStrToUpper().
* @return
*/
/**
* Removes a trailing slash from the member string, if present.
* Calls RTPathStripTrailingSlash() without having to mess with mutableRaw().
*/
void stripTrailingSlash();
/**
* Removes a trailing filename from the member string, if present.
* Calls RTPathStripFilename() without having to mess with mutableRaw().
*/
void stripFilename();
/**
* Removes a trailing file name extension from the member string, if present.
* Calls RTPathStripExt() without having to mess with mutableRaw().
*/
void stripExt();
/**
* Attempts to convert the member string into a 32-bit integer.
*
* @returns 32-bit unsigned number on success.
* @returns 0 on failure.
*/
int toInt32() const
{
return RTStrToInt32(m_psz);
}
/**
* Attempts to convert the member string into an unsigned 32-bit integer.
*
* @returns 32-bit unsigned number on success.
* @returns 0 on failure.
*/
int toUInt32() const
{
return RTStrToUInt32(m_psz);
}
/**
* Static immutable null object. May be used for comparison purposes.
*/
/**
* As with the ministring::copyFrom() variants, this unconditionally
* sets the members to a copy of the given other strings and makes
* no assumptions about previous contents. This can therefore be used
* both in copy constructors, when member variables have no defined
* value, and in assignments after having called cleanup().
*
* This variant converts from a UTF-16 string, most probably from
* a Bstr assignment.
*
* @param rs
*/
{
if (s && *s)
{
RTUtf16ToUtf8((PRTUTF16)s, &m_psz); /** @todo r=bird: This isn't throwing std::bad_alloc / handling return codes.
* Also, this technically requires using RTStrFree, ministring::cleanup() uses RTMemFree. */
}
else
{
m_cbLength = 0;
m_cbAllocated = 0;
}
}
};
/**
* This class is a printf-like formatter for Utf8Str strings. Its purpose is
* to construct Utf8Str objects from a format string and a list of arguments
* for the format string.
*
* The usage of this class is like the following:
* <code>
* Utf8StrFmt string ("program name = %s", argv[0]);
* </code>
*/
{
/**
* Constructs a new string given the format string and the list
* of the arguments for the format string.
*
* @param format printf-like format string (in UTF-8 encoding)
* @param ... list of the arguments for the format string
*/
{
}
Utf8StrFmt() {}
};
/**
* This class is a vprintf-like formatter for Utf8Str strings. It is
* identical to Utf8StrFmt except that its constructor takes a va_list
* argument instead of ellipsis.
*
* Note that a separate class is necessary because va_list is defined as
* |char *| on most platforms. For this reason, if we had two overloaded
* constructors in Utf8StrFmt (one taking ellipsis and another one taking
* va_list) then composing a constructor call using exactly two |char *|
* arguments would cause the compiler to use the va_list overload instead of
* the ellipsis one which is obviously wrong. The compiler would choose
* va_list because ellipsis has the lowest rank when it comes to resolving
* overloads, as opposed to va_list which is an exact match for |char *|.
*/
{
/**
* Constructs a new string given the format string and the list
* of the arguments for the format string.
*
* @param format printf-like format string (in UTF-8 encoding)
* @param args list of arguments for the format string
*/
};
/**
* The BstrFmt class is a shortcut to <tt>Bstr(Utf8StrFmt(...))</tt>.
*/
{
/**
* Constructs a new string given the format string and the list of the
* arguments for the format string.
*
* @param aFormat printf-like format string (in UTF-8 encoding).
* @param ... List of the arguments for the format string.
*/
{
}
};
/**
* The BstrFmtVA class is a shortcut to <tt>Bstr(Utf8StrFmtVA(...))</tt>.
*/
{
/**
* Constructs a new string given the format string and the list of the
* arguments for the format string.
*
* @param aFormat printf-like format string (in UTF-8 encoding).
* @param aArgs List of arguments for the format string
*/
{
}
};
} /* namespace com */
#endif /* !___VBox_com_string_h */