/* ============================================================================== This file is part of the JUCE library - "Jules' Utility Class Extensions" Copyright 2004-11 by Raw Material Software Ltd. ------------------------------------------------------------------------------ JUCE can be redistributed and/or modified under the terms of the GNU General Public License (Version 2), as published by the Free Software Foundation. A copy of the license is included in the JUCE distribution, or can be found online at www.gnu.org/licenses. JUCE is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. ------------------------------------------------------------------------------ To release a closed-source product which uses JUCE, commercial licenses are available: visit www.rawmaterialsoftware.com/juce for more information. ============================================================================== */ #ifndef __JUCE_CHARACTERFUNCTIONS_JUCEHEADER__ #define __JUCE_CHARACTERFUNCTIONS_JUCEHEADER__ //============================================================================== #if JUCE_WINDOWS && ! DOXYGEN #define JUCE_NATIVE_WCHAR_IS_UTF8 0 #define JUCE_NATIVE_WCHAR_IS_UTF16 1 #define JUCE_NATIVE_WCHAR_IS_UTF32 0 #else /** This macro will be set to 1 if the compiler's native wchar_t is an 8-bit type. */ #define JUCE_NATIVE_WCHAR_IS_UTF8 0 /** This macro will be set to 1 if the compiler's native wchar_t is a 16-bit type. */ #define JUCE_NATIVE_WCHAR_IS_UTF16 0 /** This macro will be set to 1 if the compiler's native wchar_t is a 32-bit type. */ #define JUCE_NATIVE_WCHAR_IS_UTF32 1 #endif #if JUCE_NATIVE_WCHAR_IS_UTF32 || DOXYGEN /** A platform-independent 32-bit unicode character type. */ typedef wchar_t juce_wchar; #else typedef uint32 juce_wchar; #endif #ifndef DOXYGEN /** This macro is deprecated, but preserved for compatibility with old code. */ #define JUCE_T(stringLiteral) (L##stringLiteral) #endif #if JUCE_DEFINE_T_MACRO /** The 'T' macro is an alternative for using the "L" prefix in front of a string literal. This macro is deprecated, but available for compatibility with old code if you set JUCE_DEFINE_T_MACRO = 1. The fastest, most portable and best way to write your string literals is as standard char strings, using escaped utf-8 character sequences for extended characters, rather than trying to store them as wide-char strings. */ #define T(stringLiteral) JUCE_T(stringLiteral) #endif //============================================================================== /** A collection of functions for manipulating characters and character strings. Most of these methods are designed for internal use by the String and CharPointer classes, but some of them may be useful to call directly. @see String, CharPointer_UTF8, CharPointer_UTF16, CharPointer_UTF32 */ class JUCE_API CharacterFunctions { public: //============================================================================== /** Converts a character to upper-case. */ static juce_wchar toUpperCase (juce_wchar character) noexcept; /** Converts a character to lower-case. */ static juce_wchar toLowerCase (juce_wchar character) noexcept; /** Checks whether a unicode character is upper-case. */ static bool isUpperCase (juce_wchar character) noexcept; /** Checks whether a unicode character is lower-case. */ static bool isLowerCase (juce_wchar character) noexcept; /** Checks whether a character is whitespace. */ static bool isWhitespace (char character) noexcept; /** Checks whether a character is whitespace. */ static bool isWhitespace (juce_wchar character) noexcept; /** Checks whether a character is a digit. */ static bool isDigit (char character) noexcept; /** Checks whether a character is a digit. */ static bool isDigit (juce_wchar character) noexcept; /** Checks whether a character is alphabetic. */ static bool isLetter (char character) noexcept; /** Checks whether a character is alphabetic. */ static bool isLetter (juce_wchar character) noexcept; /** Checks whether a character is alphabetic or numeric. */ static bool isLetterOrDigit (char character) noexcept; /** Checks whether a character is alphabetic or numeric. */ static bool isLetterOrDigit (juce_wchar character) noexcept; /** Returns 0 to 16 for '0' to 'F", or -1 for characters that aren't a legal hex digit. */ static int getHexDigitValue (juce_wchar digit) noexcept; //============================================================================== /** Parses a character string to read a floating-point number. Note that this will advance the pointer that is passed in, leaving it at the end of the number. */ template static double readDoubleValue (CharPointerType& text) noexcept { double result[3] = { 0 }, accumulator[2] = { 0 }; int exponentAdjustment[2] = { 0 }, exponentAccumulator[2] = { -1, -1 }; int exponent = 0, decPointIndex = 0, digit = 0; int lastDigit = 0, numSignificantDigits = 0; bool isNegative = false, digitsFound = false; const int maxSignificantDigits = 15 + 2; text = text.findEndOfWhitespace(); juce_wchar c = *text; switch (c) { case '-': isNegative = true; // fall-through.. case '+': c = *++text; } switch (c) { case 'n': case 'N': if ((text[1] == 'a' || text[1] == 'A') && (text[2] == 'n' || text[2] == 'N')) return std::numeric_limits::quiet_NaN(); break; case 'i': case 'I': if ((text[1] == 'n' || text[1] == 'N') && (text[2] == 'f' || text[2] == 'F')) return std::numeric_limits::infinity(); break; } for (;;) { if (text.isDigit()) { lastDigit = digit; digit = (int) text.getAndAdvance() - '0'; digitsFound = true; if (decPointIndex != 0) exponentAdjustment[1]++; if (numSignificantDigits == 0 && digit == 0) continue; if (++numSignificantDigits > maxSignificantDigits) { if (digit > 5) ++accumulator [decPointIndex]; else if (digit == 5 && (lastDigit & 1) != 0) ++accumulator [decPointIndex]; if (decPointIndex > 0) exponentAdjustment[1]--; else exponentAdjustment[0]++; while (text.isDigit()) { ++text; if (decPointIndex == 0) exponentAdjustment[0]++; } } else { const double maxAccumulatorValue = (double) ((std::numeric_limits::max() - 9) / 10); if (accumulator [decPointIndex] > maxAccumulatorValue) { result [decPointIndex] = mulexp10 (result [decPointIndex], exponentAccumulator [decPointIndex]) + accumulator [decPointIndex]; accumulator [decPointIndex] = 0; exponentAccumulator [decPointIndex] = 0; } accumulator [decPointIndex] = accumulator[decPointIndex] * 10 + digit; exponentAccumulator [decPointIndex]++; } } else if (decPointIndex == 0 && *text == '.') { ++text; decPointIndex = 1; if (numSignificantDigits > maxSignificantDigits) { while (text.isDigit()) ++text; break; } } else { break; } } result[0] = mulexp10 (result[0], exponentAccumulator[0]) + accumulator[0]; if (decPointIndex != 0) result[1] = mulexp10 (result[1], exponentAccumulator[1]) + accumulator[1]; c = *text; if ((c == 'e' || c == 'E') && digitsFound) { bool negativeExponent = false; switch (*++text) { case '-': negativeExponent = true; // fall-through.. case '+': ++text; } while (text.isDigit()) exponent = (exponent * 10) + ((int) text.getAndAdvance() - '0'); if (negativeExponent) exponent = -exponent; } double r = mulexp10 (result[0], exponent + exponentAdjustment[0]); if (decPointIndex != 0) r += mulexp10 (result[1], exponent - exponentAdjustment[1]); return isNegative ? -r : r; } /** Parses a character string, to read a floating-point value. */ template static double getDoubleValue (CharPointerType text) noexcept { return readDoubleValue (text); } //============================================================================== /** Parses a character string, to read an integer value. */ template static IntType getIntValue (const CharPointerType& text) noexcept { IntType v = 0; CharPointerType s (text.findEndOfWhitespace()); const bool isNeg = *s == '-'; if (isNeg) ++s; for (;;) { const juce_wchar c = s.getAndAdvance(); if (c >= '0' && c <= '9') v = v * 10 + (IntType) (c - '0'); else break; } return isNeg ? -v : v; } //============================================================================== /** Counts the number of characters in a given string, stopping if the count exceeds a specified limit. */ template static size_t lengthUpTo (CharPointerType text, const size_t maxCharsToCount) noexcept { size_t len = 0; while (len < maxCharsToCount && text.getAndAdvance() != 0) ++len; return len; } /** Counts the number of characters in a given string, stopping if the count exceeds a specified end-pointer. */ template static size_t lengthUpTo (CharPointerType start, const CharPointerType& end) noexcept { size_t len = 0; while (start < end && start.getAndAdvance() != 0) ++len; return len; } /** Copies null-terminated characters from one string to another. */ template static void copyAll (DestCharPointerType& dest, SrcCharPointerType src) noexcept { for (;;) { const juce_wchar c = src.getAndAdvance(); if (c == 0) break; dest.write (c); } dest.writeNull(); } /** Copies characters from one string to another, up to a null terminator or a given byte size limit. */ template static int copyWithDestByteLimit (DestCharPointerType& dest, SrcCharPointerType src, int maxBytes) noexcept { typename DestCharPointerType::CharType const* const startAddress = dest.getAddress(); maxBytes -= sizeof (typename DestCharPointerType::CharType); // (allow for a terminating null) for (;;) { const juce_wchar c = src.getAndAdvance(); const int bytesNeeded = (int) DestCharPointerType::getBytesRequiredFor (c); maxBytes -= bytesNeeded; if (c == 0 || maxBytes < 0) break; dest.write (c); } dest.writeNull(); return (int) (getAddressDifference (dest.getAddress(), startAddress) + sizeof (typename DestCharPointerType::CharType)); } /** Copies characters from one string to another, up to a null terminator or a given maximum number of characters. */ template static void copyWithCharLimit (DestCharPointerType& dest, SrcCharPointerType src, int maxChars) noexcept { while (--maxChars > 0) { const juce_wchar c = src.getAndAdvance(); if (c == 0) break; dest.write (c); } dest.writeNull(); } /** Compares two null-terminated character strings. */ template static int compare (CharPointerType1 s1, CharPointerType2 s2) noexcept { for (;;) { const int c1 = (int) s1.getAndAdvance(); const int c2 = (int) s2.getAndAdvance(); const int diff = c1 - c2; if (diff != 0) return diff < 0 ? -1 : 1; else if (c1 == 0) break; } return 0; } /** Compares two null-terminated character strings, up to a given number of characters. */ template static int compareUpTo (CharPointerType1 s1, CharPointerType2 s2, int maxChars) noexcept { while (--maxChars >= 0) { const int c1 = (int) s1.getAndAdvance(); const int c2 = (int) s2.getAndAdvance(); const int diff = c1 - c2; if (diff != 0) return diff < 0 ? -1 : 1; else if (c1 == 0) break; } return 0; } /** Compares two null-terminated character strings, using a case-independant match. */ template static int compareIgnoreCase (CharPointerType1 s1, CharPointerType2 s2) noexcept { for (;;) { int c1 = (int) s1.toUpperCase(); int c2 = (int) s2.toUpperCase(); ++s1; ++s2; const int diff = c1 - c2; if (diff != 0) return diff < 0 ? -1 : 1; else if (c1 == 0) break; } return 0; } /** Compares two null-terminated character strings, using a case-independent match. */ template static int compareIgnoreCaseUpTo (CharPointerType1 s1, CharPointerType2 s2, int maxChars) noexcept { while (--maxChars >= 0) { int c1 = s1.toUpperCase(); int c2 = s2.toUpperCase(); ++s1; ++s2; const int diff = c1 - c2; if (diff != 0) return diff < 0 ? -1 : 1; else if (c1 == 0) break; } return 0; } /** Finds the character index of a given substring in another string. Returns -1 if the substring is not found. */ template static int indexOf (CharPointerType1 haystack, const CharPointerType2& needle) noexcept { int index = 0; const int needleLength = (int) needle.length(); for (;;) { if (haystack.compareUpTo (needle, needleLength) == 0) return index; if (haystack.getAndAdvance() == 0) return -1; ++index; } } /** Finds the character index of a given substring in another string, using a case-independent match. Returns -1 if the substring is not found. */ template static int indexOfIgnoreCase (CharPointerType1 haystack, const CharPointerType2& needle) noexcept { int index = 0; const int needleLength = (int) needle.length(); for (;;) { if (haystack.compareIgnoreCaseUpTo (needle, needleLength) == 0) return index; if (haystack.getAndAdvance() == 0) return -1; ++index; } } /** Finds the character index of a given character in another string. Returns -1 if the character is not found. */ template static int indexOfChar (Type text, const juce_wchar charToFind) noexcept { int i = 0; while (! text.isEmpty()) { if (text.getAndAdvance() == charToFind) return i; ++i; } return -1; } /** Finds the character index of a given character in another string, using a case-independent match. Returns -1 if the character is not found. */ template static int indexOfCharIgnoreCase (Type text, juce_wchar charToFind) noexcept { charToFind = CharacterFunctions::toLowerCase (charToFind); int i = 0; while (! text.isEmpty()) { if (text.toLowerCase() == charToFind) return i; ++text; ++i; } return -1; } /** Returns a pointer to the first non-whitespace character in a string. If the string contains only whitespace, this will return a pointer to its null terminator. */ template static Type findEndOfWhitespace (const Type& text) noexcept { Type p (text); while (p.isWhitespace()) ++p; return p; } /** Returns a pointer to the first character in the string which is found in the breakCharacters string. */ template static Type findEndOfToken (const Type& text, const Type& breakCharacters, const Type& quoteCharacters) { Type t (text); juce_wchar currentQuoteChar = 0; while (! t.isEmpty()) { const juce_wchar c = t.getAndAdvance(); if (currentQuoteChar == 0 && breakCharacters.indexOf (c) >= 0) { --t; break; } if (quoteCharacters.indexOf (c) >= 0) { if (currentQuoteChar == 0) currentQuoteChar = c; else if (currentQuoteChar == c) currentQuoteChar = 0; } } return t; } private: static double mulexp10 (const double value, int exponent) noexcept; }; #endif // __JUCE_CHARACTERFUNCTIONS_JUCEHEADER__