33#if U_SHOW_CPLUSPLUS_API
56#if !UCONFIG_NO_BREAK_ITERATION
75 char16_t *dest, int32_t destCapacity,
76 const char16_t *src, int32_t srcLength,
83class StringCharacterIterator;
84class UnicodeStringAppendable;
98#define US_INV icu::UnicodeString::kInvariant
120#if !U_CHAR16_IS_TYPEDEF
121# define UNICODE_STRING(cs, _length) icu::UnicodeString(true, u ## cs, _length)
123# define UNICODE_STRING(cs, _length) icu::UnicodeString(true, (const char16_t*)u ## cs, _length)
135#define UNICODE_STRING_SIMPLE(cs) UNICODE_STRING(cs, -1)
144#ifndef UNISTR_FROM_CHAR_EXPLICIT
145# if defined(U_COMBINED_IMPLEMENTATION) || defined(U_COMMON_IMPLEMENTATION) || defined(U_I18N_IMPLEMENTATION) || defined(U_IO_IMPLEMENTATION)
147# define UNISTR_FROM_CHAR_EXPLICIT explicit
150# define UNISTR_FROM_CHAR_EXPLICIT
164#ifndef UNISTR_FROM_STRING_EXPLICIT
165# if defined(U_COMBINED_IMPLEMENTATION) || defined(U_COMMON_IMPLEMENTATION) || defined(U_I18N_IMPLEMENTATION) || defined(U_IO_IMPLEMENTATION)
167# define UNISTR_FROM_STRING_EXPLICIT explicit
170# define UNISTR_FROM_STRING_EXPLICIT
207#ifndef UNISTR_OBJECT_SIZE
208# define UNISTR_OBJECT_SIZE 64
330#ifndef U_HIDE_DRAFT_API
346 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
348 std::u16string_view
sv(internal::toU16StringView(text));
350 return !isBogus() && (len =
length()) ==
sv.length() && doEquals(
sv.data(), len);
363#ifndef U_HIDE_DRAFT_API
381 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
1122 inline int32_t indexOf(
char16_t c)
const;
1142 inline int32_t indexOf(
char16_t c,
1167 inline int32_t indexOf(
char16_t c,
1305 inline int32_t lastIndexOf(
char16_t c)
const;
1325 inline int32_t lastIndexOf(
char16_t c,
1350 inline int32_t lastIndexOf(
char16_t c,
1508 inline void extract(
int32_t start,
1547 inline void extract(
int32_t start,
1606#if U_CHARSET_IS_UTF8 || !UCONFIG_NO_CONVERSION
1634#if !UCONFIG_NO_CONVERSION
1664 const char*
codepage =
nullptr)
const;
1776 template<
typename StringClass>
1859 inline UBool isEmpty()
const;
1870 inline int32_t getCapacity()
const;
1879 inline int32_t hashCode()
const;
1893 inline UBool isBogus()
const;
1948#ifndef U_HIDE_DRAFT_API
1959 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
1962 return doReplace(0,
length(), internal::toU16StringView(
src));
2215#ifndef U_HIDE_DRAFT_API
2226 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
2228 return doAppend(internal::toU16StringView(
src));
2288#ifndef U_HIDE_DRAFT_API
2299 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
2301 return doAppend(internal::toU16StringView(
src));
2782#if !UCONFIG_NO_BREAK_ITERATION
2991 inline const char16_t *getBuffer()
const;
3028#ifndef U_HIDE_DRAFT_API
3035 inline operator std::u16string_view()
const {
3036 return {getBuffer(),
static_cast<std::u16string_view::size_type
>(
length())};
3039#if U_SIZEOF_WCHAR_T==2 || defined(U_IN_DOXYGEN)
3049 inline operator std::wstring_view()
const {
3050 const char16_t *p = getBuffer();
3051#ifdef U_ALIASING_BARRIER
3054 return {
reinterpret_cast<const wchar_t *
>(p), (std::wstring_view::size_type)
length() };
3103#ifdef U_HIDE_DRAFT_API
3127#if !U_CHAR16_IS_TYPEDEF && \
3128 (defined(U_HIDE_DRAFT_API) || (defined(_LIBCPP_VERSION) && _LIBCPP_VERSION >= 180000))
3152#if defined(U_HIDE_DRAFT_API) && (U_SIZEOF_WCHAR_T==2 || defined(U_IN_DOXYGEN))
3174 UnicodeString(ConstChar16Ptr(text), -1) {}
3208#if !U_CHAR16_IS_TYPEDEF
3229#if U_SIZEOF_WCHAR_T==2 || defined(U_IN_DOXYGEN)
3260#ifndef U_HIDE_DRAFT_API
3273 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
3275 fUnion.fFields.fLengthAndFlags = kShortString;
3276 doAppend(internal::toU16StringViewNullable(text));
3334#if !U_CHAR16_IS_TYPEDEF
3347#if U_SIZEOF_WCHAR_T==2 || defined(U_IN_DOXYGEN)
3371#if U_CHARSET_IS_UTF8 || !UCONFIG_NO_CONVERSION
3410#if !UCONFIG_NO_CONVERSION
3576#ifndef U_HIDE_DRAFT_API
3599 template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
3601 return readOnlyAliasFromU16StringView(internal::toU16StringView(text));
3624 return readOnlyAliasFromUnicodeString(text);
3755 static UnicodeString readOnlyAliasFromU16StringView(std::u16string_view text);
3767 char *target,
int32_t capacity)
const;
3774 return doEquals(text.getArrayStart(), len);
3776 UBool doEquals(
const char16_t *text,
int32_t len)
const;
3779 doEqualsSubstring(
int32_t start,
3805 doCompareCodePointOrder(
int32_t start,
3841 int32_t doLastIndexOf(
char16_t c,
3854 inline void doExtract(
int32_t start,
3858 inline char16_t doCharAt(
int32_t offset)
const;
3885 inline char16_t* getArrayStart();
3886 inline const char16_t* getArrayStart()
const;
3888 inline UBool hasShortLength()
const;
3889 inline int32_t getShortLength()
const;
3893 inline UBool isWritable()
const;
3896 inline UBool isBufferWritable()
const;
3899 inline void setZeroLength();
3900 inline void setShortLength(
int32_t len);
3901 inline void setLength(
int32_t len);
3902 inline void setToEmpty();
3903 inline void setArray(
char16_t *array,
int32_t len,
int32_t capacity);
3913 void releaseArray();
3925 inline void pinIndex(
int32_t& start)
const;
3926 inline void pinIndices(
int32_t& start,
3929#if !UCONFIG_NO_CONVERSION
4005 kInvalidUChar=0xffff,
4011 kUsingStackBuffer=2,
4013 kBufferIsReadonly=8,
4016 kAllStorageFlags=0x1f,
4019 kLength1=1<<kLengthShift,
4020 kMaxShortLength=0x3ff,
4021 kLengthIsLarge=0xffe0,
4024 kShortString=kUsingStackBuffer,
4025 kLongString=kRefCounted,
4026 kReadonlyAlias=kBufferIsReadonly,
4030 friend class UnicodeStringAppendable;
4032 union StackBufferOrFields;
4033 friend union StackBufferOrFields;
4076 union StackBufferOrFields {
4080 int16_t fLengthAndFlags;
4081 char16_t fBuffer[US_STACKBUF_SIZE];
4084 int16_t fLengthAndFlags;
4105#ifndef U_HIDE_DRAFT_API
4116template<
typename S,
typename = std::enable_if_t<ConvertibleToU16StringView<S>>>
4122#ifndef U_FORCE_HIDE_INTERNAL_API
4137UnicodeString::pinIndex(
int32_t& start)
const
4142 }
else if(start > length()) {
4148UnicodeString::pinIndices(int32_t& start,
4149 int32_t& _length)
const
4152 int32_t len = length();
4155 }
else if(start > len) {
4160 }
else if(_length > (len - start)) {
4161 _length = (len - start);
4166UnicodeString::getArrayStart() {
4167 return (fUnion.fFields.fLengthAndFlags&kUsingStackBuffer) ?
4168 fUnion.fStackFields.fBuffer : fUnion.fFields.fArray;
4171inline const char16_t*
4172UnicodeString::getArrayStart()
const {
4173 return (fUnion.fFields.fLengthAndFlags&kUsingStackBuffer) ?
4174 fUnion.fStackFields.fBuffer : fUnion.fFields.fArray;
4182UnicodeString::UnicodeString() {
4183 fUnion.fStackFields.fLengthAndFlags=kShortString;
4186inline UnicodeString::UnicodeString(
const std::nullptr_t ) {
4187 fUnion.fStackFields.fLengthAndFlags=kShortString;
4190inline UnicodeString::UnicodeString(
const std::nullptr_t ,
int32_t ) {
4191 fUnion.fStackFields.fLengthAndFlags=kShortString;
4195 fUnion.fStackFields.fLengthAndFlags=kShortString;
4202UnicodeString::hasShortLength()
const {
4203 return fUnion.fFields.fLengthAndFlags>=0;
4207UnicodeString::getShortLength()
const {
4210 return fUnion.fFields.fLengthAndFlags>>kLengthShift;
4214UnicodeString::length()
const {
4215 return hasShortLength() ? getShortLength() : fUnion.fFields.fLength;
4219UnicodeString::getCapacity()
const {
4220 return (fUnion.fFields.fLengthAndFlags&kUsingStackBuffer) ?
4221 US_STACKBUF_SIZE : fUnion.fFields.fCapacity;
4225UnicodeString::hashCode()
const
4226{
return doHashCode(); }
4229UnicodeString::isBogus()
const
4230{
return fUnion.fFields.fLengthAndFlags & kIsBogus; }
4233UnicodeString::isWritable()
const
4234{
return !(fUnion.fFields.fLengthAndFlags & (kOpenGetBuffer | kIsBogus)); }
4237UnicodeString::isBufferWritable()
const
4240 !(fUnion.fFields.fLengthAndFlags&(kOpenGetBuffer|kIsBogus|kBufferIsReadonly)) &&
4241 (!(fUnion.fFields.fLengthAndFlags&kRefCounted) || refCount()==1);
4244inline const char16_t *
4245UnicodeString::getBuffer()
const {
4246 if(fUnion.fFields.fLengthAndFlags&(kIsBogus|kOpenGetBuffer)) {
4248 }
else if(fUnion.fFields.fLengthAndFlags&kUsingStackBuffer) {
4249 return fUnion.fStackFields.fBuffer;
4251 return fUnion.fFields.fArray;
4259UnicodeString::doCompare(
int32_t start,
4266 return static_cast<int8_t>(!isBogus());
4268 srcText.pinIndices(srcStart, srcLength);
4269 return doCompare(start, thisLength, srcText.getArrayStart(), srcStart, srcLength);
4274UnicodeString::doEqualsSubstring(int32_t start,
4276 const UnicodeString& srcText,
4278 int32_t srcLength)
const
4280 if(srcText.isBogus()) {
4283 srcText.pinIndices(srcStart, srcLength);
4284 return !isBogus() && doEqualsSubstring(start, thisLength, srcText.getArrayStart(), srcStart, srcLength);
4295 return !text.
isBogus() && len == textLength && doEquals(text, len);
4301{
return (!
operator==(text)); }
4305{
return doCompare(0, length(), text, 0, text.
length()) == 1; }
4309{
return doCompare(0, length(), text, 0, text.
length()) == -1; }
4313{
return doCompare(0, length(), text, 0, text.
length()) != -1; }
4317{
return doCompare(0, length(), text, 0, text.
length()) != 1; }
4321{
return doCompare(0, length(), text, 0, text.
length()); }
4362{
return doCompare(start, limit - start,
4366UnicodeString::doCompareCodePointOrder(
int32_t start,
4373 return static_cast<int8_t>(!isBogus());
4375 srcText.pinIndices(srcStart, srcLength);
4376 return doCompareCodePointOrder(start, thisLength, srcText.getArrayStart(), srcStart, srcLength);
4382{
return doCompareCodePointOrder(0, length(), text, 0, text.
length()); }
4385UnicodeString::compareCodePointOrder(
int32_t start,
4396UnicodeString::compareCodePointOrder(
int32_t start,
4404UnicodeString::compareCodePointOrder(
int32_t start,
4410UnicodeString::compareCodePointOrder(
int32_t start,
4418UnicodeString::compareCodePointOrderBetween(
int32_t start,
4423{
return doCompareCodePointOrder(start, limit - start,
4427UnicodeString::doCaseCompare(
int32_t start,
4435 return static_cast<int8_t>(!isBogus());
4437 srcText.pinIndices(srcStart, srcLength);
4438 return doCaseCompare(start, thisLength, srcText.getArrayStart(), srcStart, srcLength, options);
4444 return doCaseCompare(0, length(), text, 0, text.
length(), options);
4518{
return indexOf(text, 0, text.
length(), 0, length()); }
4524 return indexOf(text, 0, text.
length(), start, length() - start);
4549UnicodeString::indexOf(
char16_t c,
4552{
return doIndexOf(c, start,
_length); }
4558{
return doIndexOf(c, start,
_length); }
4561UnicodeString::indexOf(
char16_t c)
const
4562{
return doIndexOf(c, 0, length()); }
4566{
return indexOf(c, 0, length()); }
4569UnicodeString::indexOf(
char16_t c,
4572 return doIndexOf(c, start, length() - start);
4579 return indexOf(c, start, length() - start);
4617{
return lastIndexOf(text, 0, text.
length(), start,
_length); }
4623 return lastIndexOf(text, 0, text.
length(), start, length() - start);
4628{
return lastIndexOf(text, 0, text.
length(), 0, length()); }
4631UnicodeString::lastIndexOf(
char16_t c,
4634{
return doLastIndexOf(c, start,
_length); }
4640 return doLastIndexOf(c, start,
_length);
4644UnicodeString::lastIndexOf(
char16_t c)
const
4645{
return doLastIndexOf(c, 0, length()); }
4649 return lastIndexOf(c, 0, length());
4653UnicodeString::lastIndexOf(
char16_t c,
4656 return doLastIndexOf(c, start, length() - start);
4663 return lastIndexOf(c, start, length() - start);
4668{
return doEqualsSubstring(0, text.
length(), text, 0, text.
length()); }
4694{
return doEqualsSubstring(length() - text.
length(), text.
length(),
4695 text, 0, text.
length()); }
4768{
return doReplace(start, limit - start,
srcText, 0,
srcText.length()); }
4781{
return findAndReplace(0, length(),
oldText, 0,
oldText.length(),
4796UnicodeString::doExtract(
int32_t start,
4812{ doExtract(start,
_length, target); }
4814#if !UCONFIG_NO_CONVERSION
4841 return tempSubString(start, limit - start);
4845UnicodeString::doCharAt(
int32_t offset)
const
4848 return getArrayStart()[offset];
4850 return kInvalidUChar;
4856{
return doCharAt(offset); }
4860{
return doCharAt(offset); }
4863UnicodeString::isEmpty()
const {
4865 return (fUnion.fFields.fLengthAndFlags>>kLengthShift) == 0;
4872UnicodeString::setZeroLength() {
4873 fUnion.fFields.fLengthAndFlags &= kAllStorageFlags;
4877UnicodeString::setShortLength(int32_t len) {
4879 fUnion.fFields.fLengthAndFlags =
4880 static_cast<int16_t
>((fUnion.fFields.fLengthAndFlags & kAllStorageFlags) | (len << kLengthShift));
4884UnicodeString::setLength(int32_t len) {
4885 if(len <= kMaxShortLength) {
4886 setShortLength(len);
4888 fUnion.fFields.fLengthAndFlags |= kLengthIsLarge;
4889 fUnion.fFields.fLength = len;
4894UnicodeString::setToEmpty() {
4895 fUnion.fFields.fLengthAndFlags = kShortString;
4899UnicodeString::setArray(
char16_t *array, int32_t len, int32_t capacity) {
4901 fUnion.fFields.fArray = array;
4902 fUnion.fFields.fCapacity = capacity;
4905inline UnicodeString&
4906UnicodeString::operator= (
char16_t ch)
4907{
return doReplace(0, length(), &
ch, 0, 1); }
4911{
return replace(0, length(),
ch); }
4949 return doReplace(0, length(), &
srcChar, 0, 1);
4956 return replace(0, length(),
srcChar);
4982{
return doAppend(&
srcChar, 0, 1); }
4985UnicodeString::operator+= (
char16_t ch)
4986{
return doAppend(&
ch, 0, 1); }
5025{
return doReplace(start, 0, &
srcChar, 0, 1); }
5030{
return replace(start, 0,
srcChar); }
5034UnicodeString::remove()
5053 return doReplace(start,
_length,
nullptr, 0, 0);
5059{
return doReplace(start, limit - start,
nullptr, 0, 0); }
5064 return doReplace(0, start,
nullptr, 0, 0);
5083UnicodeString::reverse()
5084{
return doReverse(0, length()); }
5089{
return doReverse(start,
_length); }
C++ API: Interface for writing bytes, and implementation classes.
C++ API: char16_t pointer wrappers with implicit conversion from bit-compatible raw pointer types.
#define U_ALIASING_BARRIER(ptr)
Barrier for pointer anti-aliasing optimizations even across function boundaries.
The BreakIterator class implements methods for finding the location of boundaries in text.
A ByteSink can be filled with bytes.
char16_t * wrapper with implicit conversion from distinct but bit-compatible pointer types.
const char16_t * wrapper with implicit conversion from distinct but bit-compatible pointer types.
Records lengths of string edits but not replacement text.
"Smart pointer" base class; do not use directly: use LocalPointer etc.
A Locale object represents a specific geographical, political, or cultural region.
Replaceable is an abstract base class representing a string of characters that supports the replaceme...
virtual void extractBetween(int32_t start, int32_t limit, UnicodeString &target) const =0
Copies characters in the range [start, limit) into the UnicodeString target.
char16_t charAt(int32_t offset) const
Returns the 16-bit code unit at the given offset into the text.
int32_t length() const
Returns the number of 16-bit code units in the text.
A string-like object that points to a sized piece of memory.
UnicodeString is a string class that stores Unicode characters directly and provides similar function...
int32_t indexOf(const char16_t *srcChars, int32_t srcStart, int32_t srcLength, int32_t start, int32_t length) const
Locate in this the first occurrence in the range [start, start + length) of the characters in srcChar...
UnicodeString(const UnicodeString &that)
Copy constructor.
void swap(UnicodeString &other) noexcept
Swap strings.
virtual char16_t getCharAt(int32_t offset) const override
The change in Replaceable to use virtual getCharAt() allows UnicodeString::charAt() to be inline agai...
bool operator==(const S &text) const
Equality operator.
virtual int32_t getLength() const override
Implement Replaceable::getLength() (see jitterbug 1027).
UnicodeString & setTo(char16_t *buffer, int32_t buffLength, int32_t buffCapacity)
Aliasing setTo() function, analogous to the writable-aliasing char16_t* constructor.
UnicodeString & operator=(const S &src)
Assignment operator.
UnicodeString & operator=(UnicodeString &&src) noexcept
Move assignment operator; might leave src in bogus state.
UChar32 unescapeAt(int32_t &offset) const
Unescape a single escape sequence and return the represented character.
UnicodeString(const wchar_t *text, int32_t textLength)
wchar_t * constructor.
virtual void handleReplaceBetween(int32_t start, int32_t limit, const UnicodeString &text) override
Replace a substring of this object with the given text.
UBool hasMoreChar32Than(int32_t start, int32_t length, int32_t number) const
Check if the length char16_t code units of the string contain more Unicode code points than a certain...
UnicodeString(const UnicodeString &src, int32_t srcStart, int32_t srcLength)
'Substring' constructor from subrange of source string.
virtual ~UnicodeString()
Destructor.
UnicodeString(const char *codepageData, int32_t dataLength, const char *codepage)
char* constructor.
UnicodeString(const char *codepageData, const char *codepage)
char* constructor.
UnicodeString(UBool isTerminated, ConstChar16Ptr text, int32_t textLength)
Readonly-aliasing char16_t* constructor.
static UnicodeString readOnlyAlias(const UnicodeString &text)
Readonly-aliasing factory method.
UnicodeString & toTitle(BreakIterator *titleIter, const Locale &locale, uint32_t options)
Titlecase this string, with options.
UnicodeString & append(UChar32 srcChar)
Append the code point srcChar to the UnicodeString object.
EInvariant
Constant to be used in the UnicodeString(char *, int32_t, EInvariant) constructor which constructs a ...
bool operator!=(const S &text) const
Inequality operator.
UnicodeString unescape() const
Unescape a string of characters and return a string containing the result.
UnicodeString(const UnicodeString &src, int32_t srcStart)
'Substring' constructor from tail of source string.
int32_t getChar32Limit(int32_t offset) const
Adjust a random-access offset so that it points behind a Unicode character.
UnicodeString(char16_t *buffer, int32_t buffLength, int32_t buffCapacity)
Writable-aliasing char16_t* constructor.
UnicodeString & findAndReplace(int32_t start, int32_t length, const UnicodeString &oldText, int32_t oldStart, int32_t oldLength, const UnicodeString &newText, int32_t newStart, int32_t newLength)
Replace all occurrences of characters in oldText in the range [oldStart, oldStart + oldLength) with t...
UnicodeString(int32_t capacity, UChar32 c, int32_t count)
Construct a UnicodeString with capacity to hold capacity char16_ts.
UnicodeString & operator+=(const S &src)
Append operator.
int32_t extract(int32_t start, int32_t startLength, char *target, uint32_t targetLength, const char *codepage) const
Copy the characters in the range [start, start + length) into an array of characters in a specified c...
virtual void copy(int32_t start, int32_t limit, int32_t dest) override
Copy a substring of this object, retaining attribute (out-of-band) information.
virtual void extractBetween(int32_t start, int32_t limit, UnicodeString &target) const override
Copy the characters in the range [start, limit) into the UnicodeString target.
UnicodeString & replace(int32_t start, int32_t length, const UnicodeString &srcText, int32_t srcStart, int32_t srcLength)
Replace the characters in the range [start, start + length) with the characters in srcText in the ran...
UnicodeString & toTitle(BreakIterator *titleIter)
Titlecase this string, convenience function using the default locale.
UnicodeString & fastCopyFrom(const UnicodeString &src)
Almost the same as the assignment operator.
virtual UnicodeString * clone() const override
Clone this object, an instance of a subclass of Replaceable.
UBool padLeading(int32_t targetLength, char16_t padChar=0x0020)
Pad the start of this UnicodeString with the character padChar.
int32_t getChar32Start(int32_t offset) const
Adjust a random-access offset so that it points to the beginning of a Unicode character.
UnicodeString & append(const S &src)
Appends the characters in src which is, or which is implicitly convertible to, a std::u16string_view ...
UChar32 char32At(int32_t offset) const
Return the code point that contains the code unit at offset offset.
UnicodeString(const char *src, int32_t textLength, enum EInvariant inv)
Constructs a Unicode string from an invariant-character char * string.
UnicodeString tempSubString(int32_t start=0, int32_t length=INT32_MAX) const
Create a temporary substring for the specified range.
int32_t extract(Char16Ptr dest, int32_t destCapacity, UErrorCode &errorCode) const
Copy the contents of the string into dest.
int32_t length() const
Return the length of the UnicodeString object.
virtual UChar32 getChar32At(int32_t offset) const override
The change in Replaceable to use virtual getChar32At() allows UnicodeString::char32At() to be inline ...
int32_t extract(int32_t start, int32_t startLength, char *target, uint32_t targetLength) const
Copy the characters in the range [start, start + length) into an array of characters in the platform'...
static UnicodeString fromUTF8(StringPiece utf8)
Create a UnicodeString from a UTF-8 string.
UNISTR_FROM_CHAR_EXPLICIT UnicodeString(char16_t ch)
Single char16_t (code unit) constructor.
int32_t lastIndexOf(const char16_t *srcChars, int32_t srcStart, int32_t srcLength, int32_t start, int32_t length) const
Locate in this the last occurrence in the range [start, start + length) of the characters in srcChars...
UnicodeString(wchar_t *buffer, int32_t buffLength, int32_t buffCapacity)
Writable-aliasing wchar_t * constructor.
void setToBogus()
Make this UnicodeString object invalid.
friend void swap(UnicodeString &s1, UnicodeString &s2) noexcept
Non-member UnicodeString swap function.
int32_t moveIndex32(int32_t index, int32_t delta) const
Move the code unit index along the string by delta code points.
static UnicodeString fromUTF32(const UChar32 *utf32, int32_t length)
Create a UnicodeString from a UTF-32 string.
UnicodeString & replace(int32_t start, int32_t length, UChar32 srcChar)
Replace the characters in the range [start, start + length) with the code point srcChar.
UNISTR_FROM_STRING_EXPLICIT UnicodeString(const S &text)
Constructor from text which is, or which is implicitly convertible to, a std::u16string_view or (if U...
int32_t countChar32(int32_t start=0, int32_t length=INT32_MAX) const
Count Unicode code points in the length char16_t code units of the string.
UNISTR_FROM_CHAR_EXPLICIT UnicodeString(UChar32 ch)
Single UChar32 (code point) constructor.
static UnicodeString readOnlyAlias(const S &text)
Readonly-aliasing factory method.
UnicodeString & trim()
Trims leading and trailing whitespace from this UnicodeString.
UnicodeString & operator=(const UnicodeString &srcText)
Assignment operator.
UnicodeString & setTo(UBool isTerminated, ConstChar16Ptr text, int32_t textLength)
Aliasing setTo() function, analogous to the readonly-aliasing char16_t* constructor.
int32_t extract(char *dest, int32_t destCapacity, UConverter *cnv, UErrorCode &errorCode) const
Convert the UnicodeString into a codepage string using an existing UConverter.
StringClass & toUTF8String(StringClass &result) const
Convert the UnicodeString to UTF-8 and append the result to a standard string.
UnicodeString(UnicodeString &&src) noexcept
Move constructor; might leave src in bogus state.
UnicodeString & toUpper()
Convert the characters in this to UPPER CASE following the conventions of the default locale.
UnicodeString(const char16_t *text, int32_t textLength)
char16_t* constructor.
UnicodeString(const char *src, int32_t srcLength, UConverter *cnv, UErrorCode &errorCode)
char * / UConverter constructor.
UnicodeString(const char *codepageData, int32_t dataLength)
char* constructor.
static UClassID getStaticClassID()
ICU "poor man's RTTI", returns a UClassID for this class.
UnicodeString(uint16_t *buffer, int32_t buffLength, int32_t buffCapacity)
Writable-aliasing uint16_t * constructor.
int32_t toUTF32(UChar32 *utf32, int32_t capacity, UErrorCode &errorCode) const
Convert the UnicodeString to UTF-32.
UBool isBogus() const
Determine if this object contains a valid string.
UnicodeString & toLower(const Locale &locale)
Convert the characters in this to lower case following the conventions of a specific locale.
UnicodeString & toTitle(BreakIterator *titleIter, const Locale &locale)
Titlecase this string.
UnicodeString & foldCase(uint32_t options=0)
Case-folds the characters in this string.
const char16_t * getTerminatedBuffer()
Get a read-only pointer to the internal buffer, making sure that it is NUL-terminated.
UnicodeString(const uint16_t *text, int32_t textLength)
uint16_t * constructor.
UnicodeString & toUpper(const Locale &locale)
Convert the characters in this to UPPER CASE following the conventions of a specific locale.
UnicodeString & setCharAt(int32_t offset, char16_t ch)
Set the character at the specified offset to the specified character.
virtual UClassID getDynamicClassID() const override
ICU "poor man's RTTI", returns a UClassID for the actual class.
int32_t extract(int32_t start, int32_t startLength, char *target, int32_t targetCapacity, enum EInvariant inv) const
Copy the characters in the range [start, start + startLength) into an array of characters.
char16_t * getBuffer(int32_t minCapacity)
Get a read/write pointer to the internal buffer.
UnicodeString & toLower()
Convert the characters in this to lower case following the conventions of the default locale.
UBool padTrailing(int32_t targetLength, char16_t padChar=0x0020)
Pad the end of this UnicodeString with the character padChar.
UNISTR_FROM_STRING_EXPLICIT UnicodeString(const char *codepageData)
char* constructor.
void releaseBuffer(int32_t newLength=-1)
Release a read/write buffer on a UnicodeString object with an "open" getBuffer(minCapacity).
void toUTF8(ByteSink &sink) const
Convert the UnicodeString to UTF-8 and write the result to a ByteSink.
virtual UBool hasMetaData() const override
Replaceable API.
U_CAPI int32_t u_strlen(const UChar *s)
U_EXPORT UBool operator==(const StringPiece &x, const StringPiece &y)
Global operator == for StringPiece.
U_COMMON_API UnicodeString unistr_internalConcat(const UnicodeString &s1, std::u16string_view s2)
bool operator!=(const StringPiece &x, const StringPiece &y)
Global operator != for StringPiece.
U_COMMON_API UnicodeString operator+(const UnicodeString &s1, const UnicodeString &s2)
Creates a new UnicodeString from the concatenation of two others.
const UChar * toUCharPtr(const char16_t *p)
Converts from const char16_t * to const UChar *.
C++ API: Replaceable String.
C++ API: Central ICU header for including the C++ standard <string> header and for related definition...
C++ API: StringPiece: Read-only byte string wrapper class.
struct UConverter UConverter
#define UCONFIG_NO_BREAK_ITERATION
This switch turns off break iteration.
int32_t UChar32
Define UChar32 as a type for single Unicode code points.
#define INT32_MAX
The largest value a 32 bit signed integer can hold.
int8_t UBool
The ICU boolean type, a signed-byte integer.
#define U_CAPI
This is used to declare a function as a public ICU C API.
char16_t UChar
The base type for UTF-16 code units and pointers.
#define U_SIZEOF_UCHAR
Number of bytes in a UChar (always 2).
#define UNISTR_FROM_CHAR_EXPLICIT
This can be defined to be empty or "explicit".
int32_t UStringCaseMapper(int32_t caseLocale, uint32_t options, icu::BreakIterator *iter, char16_t *dest, int32_t destCapacity, const char16_t *src, int32_t srcLength, icu::Edits *edits, UErrorCode &errorCode)
Internal string case mapping function type.
#define UNISTR_FROM_STRING_EXPLICIT
This can be defined to be empty or "explicit".
#define UNISTR_OBJECT_SIZE
Desired sizeof(UnicodeString) in bytes.
void * UClassID
UClassID is used to identify classes without using the compiler's RTTI.
Basic definitions for ICU, for both C and C++ APIs.
UErrorCode
Standard ICU4C error code type, a substitute for exceptions.
#define U_COMMON_API
Set to export library symbols from inside the common library, and to import them from outside.