//------------------------------------------------------------------------------ /* This file is part of Beast: https://github.com/vinniefalco/Beast Copyright 2013, Vinnie Falco Portions of this file are from JUCE. Copyright (c) 2013 - Raw Material Software Ltd. Please visit http://www.juce.com Permission to use, copy, modify, and/or distribute this software for any purpose with or without fee is hereby granted, provided that the above copyright notice and this permission notice appear in all copies. THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY SPECIAL , DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */ //============================================================================== #ifndef BEAST_CHARPOINTER_UTF32_H_INCLUDED #define BEAST_CHARPOINTER_UTF32_H_INCLUDED #include #include #include #include namespace beast { //============================================================================== /** Wraps a pointer to a null-terminated UTF-32 character string, and provides various methods to operate on the data. @see CharPointer_UTF8, CharPointer_UTF16 */ class CharPointer_UTF32 { public: typedef beast_wchar CharType; inline explicit CharPointer_UTF32 (const CharType* const rawPointer) noexcept : data (const_cast (rawPointer)) { } inline CharPointer_UTF32 (const CharPointer_UTF32& other) noexcept : data (other.data) { } inline CharPointer_UTF32 operator= (CharPointer_UTF32 other) noexcept { data = other.data; return *this; } inline CharPointer_UTF32 operator= (const CharType* text) noexcept { data = const_cast (text); return *this; } /** This is a pointer comparison, it doesn't compare the actual text. */ inline bool operator== (CharPointer_UTF32 other) const noexcept { return data == other.data; } inline bool operator!= (CharPointer_UTF32 other) const noexcept { return data != other.data; } inline bool operator<= (CharPointer_UTF32 other) const noexcept { return data <= other.data; } inline bool operator< (CharPointer_UTF32 other) const noexcept { return data < other.data; } inline bool operator>= (CharPointer_UTF32 other) const noexcept { return data >= other.data; } inline bool operator> (CharPointer_UTF32 other) const noexcept { return data > other.data; } /** Returns the address that this pointer is pointing to. */ inline CharType* getAddress() const noexcept { return data; } /** Returns the address that this pointer is pointing to. */ inline operator const CharType*() const noexcept { return data; } /** Returns true if this pointer is pointing to a null character. */ inline bool isEmpty() const noexcept { return *data == 0; } /** Returns the unicode character that this pointer is pointing to. */ inline beast_wchar operator*() const noexcept { return *data; } /** Moves this pointer along to the next character in the string. */ inline CharPointer_UTF32 operator++() noexcept { ++data; return *this; } /** Moves this pointer to the previous character in the string. */ inline CharPointer_UTF32 operator--() noexcept { --data; return *this; } /** Returns the character that this pointer is currently pointing to, and then advances the pointer to point to the next character. */ inline beast_wchar getAndAdvance() noexcept { return *data++; } /** Moves this pointer along to the next character in the string. */ CharPointer_UTF32 operator++ (int) noexcept { CharPointer_UTF32 temp (*this); ++data; return temp; } /** Moves this pointer forwards by the specified number of characters. */ inline void operator+= (const int numToSkip) noexcept { data += numToSkip; } inline void operator-= (const int numToSkip) noexcept { data -= numToSkip; } /** Returns the character at a given character index from the start of the string. */ inline beast_wchar& operator[] (const int characterIndex) const noexcept { return data [characterIndex]; } /** Returns a pointer which is moved forwards from this one by the specified number of characters. */ CharPointer_UTF32 operator+ (const int numToSkip) const noexcept { return CharPointer_UTF32 (data + numToSkip); } /** Returns a pointer which is moved backwards from this one by the specified number of characters. */ CharPointer_UTF32 operator- (const int numToSkip) const noexcept { return CharPointer_UTF32 (data - numToSkip); } /** Writes a unicode character to this string, and advances this pointer to point to the next position. */ inline void write (const beast_wchar charToWrite) noexcept { *data++ = charToWrite; } inline void replaceChar (const beast_wchar newChar) noexcept { *data = newChar; } /** Writes a null character to this string (leaving the pointer's position unchanged). */ inline void writeNull() const noexcept { *data = 0; } /** Returns the number of characters in this string. */ size_t length() const noexcept { #if BEAST_NATIVE_WCHAR_IS_UTF32 && ! BEAST_ANDROID return wcslen (data); #else size_t n = 0; while (data[n] != 0) ++n; return n; #endif } /** Returns the number of characters in this string, or the given value, whichever is lower. */ size_t lengthUpTo (const size_t maxCharsToCount) const noexcept { return CharacterFunctions::lengthUpTo (*this, maxCharsToCount); } /** Returns the number of characters in this string, or up to the given end pointer, whichever is lower. */ size_t lengthUpTo (const CharPointer_UTF32 end) const noexcept { return CharacterFunctions::lengthUpTo (*this, end); } /** Returns the number of bytes that are used to represent this string. This includes the terminating null character. */ size_t sizeInBytes() const noexcept { return sizeof (CharType) * (length() + 1); } /** Returns the number of bytes that would be needed to represent the given unicode character in this encoding format. */ static inline size_t getBytesRequiredFor (const beast_wchar) noexcept { return sizeof (CharType); } /** Returns the number of bytes that would be needed to represent the given string in this encoding format. The value returned does NOT include the terminating null character. */ template static size_t getBytesRequiredFor (const CharPointer text) noexcept { return sizeof (CharType) * text.length(); } /** Returns a pointer to the null character that terminates this string. */ CharPointer_UTF32 findTerminatingNull() const noexcept { return CharPointer_UTF32 (data + length()); } /** Copies a source string to this pointer, advancing this pointer as it goes. */ template void writeAll (const CharPointer src) noexcept { CharacterFunctions::copyAll (*this, src); } /** Copies a source string to this pointer, advancing this pointer as it goes. */ void writeAll (const CharPointer_UTF32 src) noexcept { const CharType* s = src.data; while ((*data = *s) != 0) { ++data; ++s; } } /** Copies a source string to this pointer, advancing this pointer as it goes. The maxDestBytes parameter specifies the maximum number of bytes that can be written to the destination buffer before stopping. */ template size_t writeWithDestByteLimit (const CharPointer src, const size_t maxDestBytes) noexcept { return CharacterFunctions::copyWithDestByteLimit (*this, src, maxDestBytes); } /** Copies a source string to this pointer, advancing this pointer as it goes. The maxChars parameter specifies the maximum number of characters that can be written to the destination buffer before stopping (including the terminating null). */ template void writeWithCharLimit (const CharPointer src, const int maxChars) noexcept { CharacterFunctions::copyWithCharLimit (*this, src, maxChars); } /** Compares this string with another one. */ template int compare (const CharPointer other) const noexcept { return CharacterFunctions::compare (*this, other); } #if BEAST_NATIVE_WCHAR_IS_UTF32 && ! BEAST_ANDROID /** Compares this string with another one. */ int compare (const CharPointer_UTF32 other) const noexcept { return wcscmp (data, other.data); } #endif /** Compares this string with another one, up to a specified number of characters. */ template int compareUpTo (const CharPointer other, const int maxChars) const noexcept { return CharacterFunctions::compareUpTo (*this, other, maxChars); } /** Compares this string with another one. */ template int compareIgnoreCase (const CharPointer other) const { return CharacterFunctions::compareIgnoreCase (*this, other); } /** Compares this string with another one, up to a specified number of characters. */ template int compareIgnoreCaseUpTo (const CharPointer other, const int maxChars) const noexcept { return CharacterFunctions::compareIgnoreCaseUpTo (*this, other, maxChars); } /** Returns the character index of a substring, or -1 if it isn't found. */ template int indexOf (const CharPointer stringToFind) const noexcept { return CharacterFunctions::indexOf (*this, stringToFind); } /** Returns the character index of a unicode character, or -1 if it isn't found. */ int indexOf (const beast_wchar charToFind) const noexcept { int i = 0; while (data[i] != 0) { if (data[i] == charToFind) return i; ++i; } return -1; } /** Returns the character index of a unicode character, or -1 if it isn't found. */ int indexOf (const beast_wchar charToFind, const bool ignoreCase) const noexcept { return ignoreCase ? CharacterFunctions::indexOfCharIgnoreCase (*this, charToFind) : CharacterFunctions::indexOfChar (*this, charToFind); } /** Returns true if the first character of this string is whitespace. */ bool isWhitespace() const { return CharacterFunctions::isWhitespace (*data) != 0; } /** Returns true if the first character of this string is a digit. */ bool isDigit() const { return CharacterFunctions::isDigit (*data) != 0; } /** Returns true if the first character of this string is a letter. */ bool isLetter() const { return CharacterFunctions::isLetter (*data) != 0; } /** Returns true if the first character of this string is a letter or digit. */ bool isLetterOrDigit() const { return CharacterFunctions::isLetterOrDigit (*data) != 0; } /** Returns true if the first character of this string is upper-case. */ bool isUpperCase() const { return CharacterFunctions::isUpperCase (*data) != 0; } /** Returns true if the first character of this string is lower-case. */ bool isLowerCase() const { return CharacterFunctions::isLowerCase (*data) != 0; } /** Returns an upper-case version of the first character of this string. */ beast_wchar toUpperCase() const noexcept { return CharacterFunctions::toUpperCase (*data); } /** Returns a lower-case version of the first character of this string. */ beast_wchar toLowerCase() const noexcept { return CharacterFunctions::toLowerCase (*data); } /** Parses this string as a 32-bit integer. */ int getIntValue32() const noexcept { return CharacterFunctions::getIntValue (*this); } /** Parses this string as a 64-bit integer. */ std::int64_t getIntValue64() const noexcept { return CharacterFunctions::getIntValue (*this); } /** Parses this string as a floating point double. */ double getDoubleValue() const noexcept { return CharacterFunctions::getDoubleValue (*this); } /** Returns the first non-whitespace character in the string. */ CharPointer_UTF32 findEndOfWhitespace() const noexcept { return CharacterFunctions::findEndOfWhitespace (*this); } /** Returns true if the given unicode character can be represented in this encoding. */ static bool canRepresent (beast_wchar character) noexcept { return ((unsigned int) character) < (unsigned int) 0x10ffff; } /** Returns true if this data contains a valid string in this encoding. */ static bool isValidString (const CharType* dataToTest, int maxBytesToRead) { maxBytesToRead /= sizeof (CharType); while (--maxBytesToRead >= 0 && *dataToTest != 0) if (! canRepresent (*dataToTest++)) return false; return true; } /** Atomically swaps this pointer for a new value, returning the previous value. */ CharPointer_UTF32 atomicSwap (const CharPointer_UTF32 newValue) { return CharPointer_UTF32 (reinterpret_cast &> (data).exchange (newValue.data)); } private: CharType* data; }; } #endif