Rename beast sources for consistency

2025-11-28 06:55:50 +00:00 · 2013-09-19 06:33:29 -07:00
parent 4e59ab2261
commit 34fffca202
256 changed files with 777 additions and 762 deletions
--- a/modules/beast_core/xml/XmlDocument.cpp
+++ b/modules/beast_core/xml/XmlDocument.cpp
@@ -0,0 +1,871 @@
+//------------------------------------------------------------------------------
+/*
+    This file is part of Beast: https://github.com/vinniefalco/Beast
+    Copyright 2013, Vinnie Falco <vinnie.falco@gmail.com>
+
+    Portions of this file are from JUCE.
+    Copyright (c) 2013 - Raw Material Software Ltd.
+    Please visit http://www.juce.com
+
+    Permission to use, copy, modify, and/or distribute this software for any
+    purpose  with  or without fee is hereby granted, provided that the above
+    copyright notice and this permission notice appear in all copies.
+
+    THE  SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
+    WITH  REGARD  TO  THIS  SOFTWARE  INCLUDING  ALL  IMPLIED  WARRANTIES  OF
+    MERCHANTABILITY  AND  FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
+    ANY  SPECIAL ,  DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
+    WHATSOEVER  RESULTING  FROM  LOSS  OF USE, DATA OR PROFITS, WHETHER IN AN
+    ACTION  OF  CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
+    OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
+*/
+//==============================================================================
+
+XmlDocument::XmlDocument (const String& documentText)
+    : originalText (documentText),
+      input (nullptr),
+      outOfData (false),
+      errorOccurred (false),
+      needToLoadDTD (false),
+      ignoreEmptyTextElements (true)
+{
+}
+
+XmlDocument::XmlDocument (const File& file)
+    : input (nullptr),
+      outOfData (false),
+      errorOccurred (false),
+      needToLoadDTD (false),
+      ignoreEmptyTextElements (true),
+      inputSource (new FileInputSource (file))
+{
+}
+
+XmlDocument::~XmlDocument()
+{
+}
+
+XmlElement* XmlDocument::parse (const File& file)
+{
+    XmlDocument doc (file);
+    return doc.getDocumentElement();
+}
+
+XmlElement* XmlDocument::parse (const String& xmlData)
+{
+    XmlDocument doc (xmlData);
+    return doc.getDocumentElement();
+}
+
+void XmlDocument::setInputSource (InputSource* const newSource) noexcept
+{
+    inputSource = newSource;
+}
+
+void XmlDocument::setEmptyTextElementsIgnored (const bool shouldBeIgnored) noexcept
+{
+    ignoreEmptyTextElements = shouldBeIgnored;
+}
+
+namespace XmlIdentifierChars
+{
+    static bool isIdentifierCharSlow (const beast_wchar c) noexcept
+    {
+        return CharacterFunctions::isLetterOrDigit (c)
+                 || c == '_' || c == '-' || c == ':' || c == '.';
+    }
+
+    static bool isIdentifierChar (const beast_wchar c) noexcept
+    {
+        static const uint32 legalChars[] = { 0, 0x7ff6000, 0x87fffffe, 0x7fffffe, 0 };
+
+        return ((int) c < (int) numElementsInArray (legalChars) * 32) ? ((legalChars [c >> 5] & (1 << (c & 31))) != 0)
+                                                                      : isIdentifierCharSlow (c);
+    }
+
+    /*
+    static void generateIdentifierCharConstants()
+    {
+        uint32 n[8] = { 0 };
+        for (int i = 0; i < 256; ++i)
+        if (isIdentifierCharSlow (i))
+            n[i >> 5] |= (1 << (i & 31));
+
+        String s;
+        for (int i = 0; i < 8; ++i)
+            s << "0x" << String::toHexString ((int) n[i]) << ", ";
+
+        DBG (s);
+    }
+    */
+
+    static String::CharPointerType findEndOfToken (String::CharPointerType p)
+    {
+        while (isIdentifierChar (*p))
+            ++p;
+
+        return p;
+    }
+}
+
+XmlElement* XmlDocument::getDocumentElement (const bool onlyReadOuterDocumentElement)
+{
+    if (originalText.isEmpty() && inputSource != nullptr)
+    {
+        ScopedPointer<InputStream> in (inputSource->createInputStream());
+
+        if (in != nullptr)
+        {
+            MemoryOutputStream data;
+            data.writeFromInputStream (*in, onlyReadOuterDocumentElement ? 8192 : -1);
+
+           #if BEAST_STRING_UTF_TYPE == 8
+            if (data.getDataSize() > 2)
+            {
+                data.writeByte (0);
+                const char* text = static_cast<const char*> (data.getData());
+
+                if (CharPointer_UTF16::isByteOrderMarkBigEndian (text)
+                      || CharPointer_UTF16::isByteOrderMarkLittleEndian (text))
+                {
+                    originalText = data.toString();
+                }
+                else
+                {
+                    if (CharPointer_UTF8::isByteOrderMark (text))
+                        text += 3;
+
+                    // parse the input buffer directly to avoid copying it all to a string..
+                    return parseDocumentElement (String::CharPointerType (text), onlyReadOuterDocumentElement);
+                }
+            }
+           #else
+            originalText = data.toString();
+           #endif
+        }
+    }
+
+    return parseDocumentElement (originalText.getCharPointer(), onlyReadOuterDocumentElement);
+}
+
+const String& XmlDocument::getLastParseError() const noexcept
+{
+    return lastError;
+}
+
+void XmlDocument::setLastError (const String& desc, const bool carryOn)
+{
+    lastError = desc;
+    errorOccurred = ! carryOn;
+}
+
+String XmlDocument::getFileContents (const String& filename) const
+{
+    if (inputSource != nullptr)
+    {
+        const ScopedPointer<InputStream> in (inputSource->createInputStreamFor (filename.trim().unquoted()));
+
+        if (in != nullptr)
+            return in->readEntireStreamAsString();
+    }
+
+    return String::empty;
+}
+
+beast_wchar XmlDocument::readNextChar() noexcept
+{
+    const beast_wchar c = input.getAndAdvance();
+
+    if (c == 0)
+    {
+        outOfData = true;
+        --input;
+    }
+
+    return c;
+}
+
+XmlElement* XmlDocument::parseDocumentElement (String::CharPointerType textToParse,
+                                               const bool onlyReadOuterDocumentElement)
+{
+    input = textToParse;
+    errorOccurred = false;
+    outOfData = false;
+    needToLoadDTD = true;
+
+    if (textToParse.isEmpty())
+    {
+        lastError = "not enough input";
+    }
+    else if (! parseHeader())
+    {
+        lastError = "malformed header";
+    }
+    else if (! parseDTD())
+    {
+        lastError = "malformed DTD";
+    }
+    else
+    {
+        lastError = String::empty;
+
+        ScopedPointer<XmlElement> result (readNextElement (! onlyReadOuterDocumentElement));
+
+        if (! errorOccurred)
+            return result.release();
+    }
+
+    return nullptr;
+}
+
+bool XmlDocument::parseHeader()
+{
+    skipNextWhiteSpace();
+
+    if (CharacterFunctions::compareUpTo (input, CharPointer_ASCII ("<?xml"), 5) == 0)
+    {
+        const String::CharPointerType headerEnd (CharacterFunctions::find (input, CharPointer_ASCII ("?>")));
+
+        if (headerEnd.isEmpty())
+            return false;
+
+       #if BEAST_DEBUG
+        const String encoding (String (input, headerEnd)
+                                 .fromFirstOccurrenceOf ("encoding", false, true)
+                                 .fromFirstOccurrenceOf ("=", false, false)
+                                 .fromFirstOccurrenceOf ("\"", false, false)
+                                 .upToFirstOccurrenceOf ("\"", false, false).trim());
+
+        /* If you load an XML document with a non-UTF encoding type, it may have been
+           loaded wrongly.. Since all the files are read via the normal beast file streams,
+           they're treated as UTF-8, so by the time it gets to the parser, the encoding will
+           have been lost. Best plan is to stick to utf-8 or if you have specific files to
+           read, use your own code to convert them to a unicode String, and pass that to the
+           XML parser.
+        */
+        bassert (encoding.isEmpty() || encoding.startsWithIgnoreCase ("utf-"));
+       #endif
+
+        input = headerEnd + 2;
+        skipNextWhiteSpace();
+    }
+
+    return true;
+}
+
+bool XmlDocument::parseDTD()
+{
+    if (CharacterFunctions::compareUpTo (input, CharPointer_ASCII ("<!DOCTYPE"), 9) == 0)
+    {
+        input += 9;
+        const String::CharPointerType dtdStart (input);
+
+        for (int n = 1; n > 0;)
+        {
+            const beast_wchar c = readNextChar();
+
+            if (outOfData)
+                return false;
+
+            if (c == '<')
+                ++n;
+            else if (c == '>')
+                --n;
+        }
+
+        dtdText = String (dtdStart, input - 1).trim();
+    }
+
+    return true;
+}
+
+void XmlDocument::skipNextWhiteSpace()
+{
+    for (;;)
+    {
+        input = input.findEndOfWhitespace();
+
+        if (input.isEmpty())
+        {
+            outOfData = true;
+            break;
+        }
+
+        if (*input == '<')
+        {
+            if (input[1] == '!'
+                 && input[2] == '-'
+                 && input[3] == '-')
+            {
+                input += 4;
+                const int closeComment = input.indexOf (CharPointer_ASCII ("-->"));
+
+                if (closeComment < 0)
+                {
+                    outOfData = true;
+                    break;
+                }
+
+                input += closeComment + 3;
+                continue;
+            }
+            
+            if (input[1] == '?')
+            {
+                input += 2;
+                const int closeBracket = input.indexOf (CharPointer_ASCII ("?>"));
+
+                if (closeBracket < 0)
+                {
+                    outOfData = true;
+                    break;
+                }
+
+                input += closeBracket + 2;
+                continue;
+            }
+        }
+
+        break;
+    }
+}
+
+void XmlDocument::readQuotedString (String& result)
+{
+    const beast_wchar quote = readNextChar();
+
+    while (! outOfData)
+    {
+        const beast_wchar c = readNextChar();
+
+        if (c == quote)
+            break;
+
+        --input;
+
+        if (c == '&')
+        {
+            readEntity (result);
+        }
+        else
+        {
+            const String::CharPointerType start (input);
+
+            for (;;)
+            {
+                const beast_wchar character = *input;
+
+                if (character == quote)
+                {
+                    result.appendCharPointer (start, input);
+                    ++input;
+                    return;
+                }
+                else if (character == '&')
+                {
+                    result.appendCharPointer (start, input);
+                    break;
+                }
+                else if (character == 0)
+                {
+                    outOfData = true;
+                    setLastError ("unmatched quotes", false);
+                    break;
+                }
+
+                ++input;
+            }
+        }
+    }
+}
+
+XmlElement* XmlDocument::readNextElement (const bool alsoParseSubElements)
+{
+    XmlElement* node = nullptr;
+
+    skipNextWhiteSpace();
+    if (outOfData)
+        return nullptr;
+
+    if (*input == '<')
+    {
+        ++input;
+        String::CharPointerType endOfToken (XmlIdentifierChars::findEndOfToken (input));
+
+        if (endOfToken == input)
+        {
+            // no tag name - but allow for a gap after the '<' before giving an error
+            skipNextWhiteSpace();
+            endOfToken = XmlIdentifierChars::findEndOfToken (input);
+
+            if (endOfToken == input)
+            {
+                setLastError ("tag name missing", false);
+                return node;
+            }
+        }
+
+        node = new XmlElement (String (input, endOfToken));
+        input = endOfToken;
+        LinkedListPointer<XmlElement::XmlAttributeNode>::Appender attributeAppender (node->attributes);
+
+        // look for attributes
+        for (;;)
+        {
+            skipNextWhiteSpace();
+
+            const beast_wchar c = *input;
+
+            // empty tag..
+            if (c == '/' && input[1] == '>')
+            {
+                input += 2;
+                break;
+            }
+
+            // parse the guts of the element..
+            if (c == '>')
+            {
+                ++input;
+
+                if (alsoParseSubElements)
+                    readChildElements (node);
+
+                break;
+            }
+
+            // get an attribute..
+            if (XmlIdentifierChars::isIdentifierChar (c))
+            {
+                String::CharPointerType attNameEnd (XmlIdentifierChars::findEndOfToken (input));
+
+                if (attNameEnd != input)
+                {
+                    const String::CharPointerType attNameStart (input);
+                    input = attNameEnd;
+
+                    skipNextWhiteSpace();
+
+                    if (readNextChar() == '=')
+                    {
+                        skipNextWhiteSpace();
+
+                        const beast_wchar nextChar = *input;
+
+                        if (nextChar == '"' || nextChar == '\'')
+                        {
+                            XmlElement::XmlAttributeNode* const newAtt
+                                = new XmlElement::XmlAttributeNode (String (attNameStart, attNameEnd),
+                                                                    String::empty);
+
+                            readQuotedString (newAtt->value);
+                            attributeAppender.append (newAtt);
+                            continue;
+                        }
+                    }
+                    else
+                    {
+                        setLastError ("expected '=' after attribute '"
+                                        + String (attNameStart, attNameEnd) + "'", false);
+                        return node;
+                    }
+                }
+            }
+            else
+            {
+                if (! outOfData)
+                    setLastError ("illegal character found in " + node->getTagName() + ": '" + c + "'", false);
+            }
+
+            break;
+        }
+    }
+
+    return node;
+}
+
+void XmlDocument::readChildElements (XmlElement* parent)
+{
+    LinkedListPointer<XmlElement>::Appender childAppender (parent->firstChildElement);
+
+    for (;;)
+    {
+        const String::CharPointerType preWhitespaceInput (input);
+        skipNextWhiteSpace();
+
+        if (outOfData)
+        {
+            setLastError ("unmatched tags", false);
+            break;
+        }
+
+        if (*input == '<')
+        {
+            const beast_wchar c1 = input[1];
+
+            if (c1 == '/')
+            {
+                // our close tag..
+                const int closeTag = input.indexOf ((beast_wchar) '>');
+
+                if (closeTag >= 0)
+                    input += closeTag + 1;
+
+                break;
+            }
+            
+            if (c1 == '!' && CharacterFunctions::compareUpTo (input + 2, CharPointer_ASCII ("[CDATA["), 7) == 0) 
+            {
+                input += 9;
+                const String::CharPointerType inputStart (input);
+
+                for (;;)
+                {
+                    const beast_wchar c0 = *input;
+
+                    if (c0 == 0)
+                    {
+                        setLastError ("unterminated CDATA section", false);
+                        outOfData = true;
+                        break;
+                    }
+                    else if (c0 == ']'
+                              && input[1] == ']'
+                              && input[2] == '>')
+                    {
+                        childAppender.append (XmlElement::createTextElement (String (inputStart, input)));
+                        input += 3;
+                        break;
+                    }
+
+                    ++input;
+                }
+            }
+            else
+            {
+                // this is some other element, so parse and add it..
+                if (XmlElement* const n = readNextElement (true))
+                    childAppender.append (n);
+                else
+                    break;
+            }
+        }
+        else // must be a character block
+        {
+            input = preWhitespaceInput; // roll back to include the leading whitespace
+            String textElementContent;
+
+            for (;;)
+            {
+                const beast_wchar c = *input;
+
+                if (c == '<')
+                    break;
+
+                if (c == 0)
+                {
+                    setLastError ("unmatched tags", false);
+                    outOfData = true;
+                    return;
+                }
+
+                if (c == '&')
+                {
+                    String entity;
+                    readEntity (entity);
+
+                    if (entity.startsWithChar ('<') && entity [1] != 0)
+                    {
+                        const String::CharPointerType oldInput (input);
+                        const bool oldOutOfData = outOfData;
+
+                        input = entity.getCharPointer();
+                        outOfData = false;
+
+                        for (;;)
+                        {
+                            XmlElement* const n = readNextElement (true);
+
+                            if (n == nullptr)
+                                break;
+
+                            childAppender.append (n);
+                        }
+
+                        input = oldInput;
+                        outOfData = oldOutOfData;
+                    }
+                    else
+                    {
+                        textElementContent += entity;
+                    }
+                }
+                else
+                {
+                    const String::CharPointerType start (input);
+
+                    for (;;)
+                    {
+                        const beast_wchar nextChar = *input;
+
+                        if (nextChar == '<' || nextChar == '&')
+                            break;
+
+                        if (nextChar == 0)
+                        {
+                            setLastError ("unmatched tags", false);
+                            outOfData = true;
+                            return;
+                        }
+
+                        ++input;
+                    }
+
+                    textElementContent.appendCharPointer (start, input);
+                }
+            }
+
+            if ((! ignoreEmptyTextElements) || textElementContent.containsNonWhitespaceChars())
+                childAppender.append (XmlElement::createTextElement (textElementContent));
+        }
+    }
+}
+
+void XmlDocument::readEntity (String& result)
+{
+    // skip over the ampersand
+    ++input;
+
+    if (input.compareIgnoreCaseUpTo (CharPointer_ASCII ("amp;"), 4) == 0)
+    {
+        input += 4;
+        result += '&';
+    }
+    else if (input.compareIgnoreCaseUpTo (CharPointer_ASCII ("quot;"), 5) == 0)
+    {
+        input += 5;
+        result += '"';
+    }
+    else if (input.compareIgnoreCaseUpTo (CharPointer_ASCII ("apos;"), 5) == 0)
+    {
+        input += 5;
+        result += '\'';
+    }
+    else if (input.compareIgnoreCaseUpTo (CharPointer_ASCII ("lt;"), 3) == 0)
+    {
+        input += 3;
+        result += '<';
+    }
+    else if (input.compareIgnoreCaseUpTo (CharPointer_ASCII ("gt;"), 3) == 0)
+    {
+        input += 3;
+        result += '>';
+    }
+    else if (*input == '#')
+    {
+        int charCode = 0;
+        ++input;
+
+        if (*input == 'x' || *input == 'X')
+        {
+            ++input;
+            int numChars = 0;
+
+            while (input[0] != ';')
+            {
+                const int hexValue = CharacterFunctions::getHexDigitValue (input[0]);
+
+                if (hexValue < 0 || ++numChars > 8)
+                {
+                    setLastError ("illegal escape sequence", true);
+                    break;
+                }
+
+                charCode = (charCode << 4) | hexValue;
+                ++input;
+            }
+
+            ++input;
+        }
+        else if (input[0] >= '0' && input[0] <= '9')
+        {
+            int numChars = 0;
+
+            while (input[0] != ';')
+            {
+                if (++numChars > 12)
+                {
+                    setLastError ("illegal escape sequence", true);
+                    break;
+                }
+
+                charCode = charCode * 10 + ((int) input[0] - '0');
+                ++input;
+            }
+
+            ++input;
+        }
+        else
+        {
+            setLastError ("illegal escape sequence", true);
+            result += '&';
+            return;
+        }
+
+        result << (beast_wchar) charCode;
+    }
+    else
+    {
+        const String::CharPointerType entityNameStart (input);
+        const int closingSemiColon = input.indexOf ((beast_wchar) ';');
+
+        if (closingSemiColon < 0)
+        {
+            outOfData = true;
+            result += '&';
+        }
+        else
+        {
+            input += closingSemiColon + 1;
+
+            result += expandExternalEntity (String (entityNameStart, (size_t) closingSemiColon));
+        }
+    }
+}
+
+String XmlDocument::expandEntity (const String& ent)
+{
+    if (ent.equalsIgnoreCase ("amp")) return String::charToString ('&');
+    if (ent.equalsIgnoreCase ("quot")) return String::charToString ('"');
+    if (ent.equalsIgnoreCase ("apos")) return String::charToString ('\'');
+    if (ent.equalsIgnoreCase ("lt")) return String::charToString ('<');
+    if (ent.equalsIgnoreCase ("gt")) return String::charToString ('>');
+
+    if (ent[0] == '#')
+    {
+        const beast_wchar char1 = ent[1];
+
+        if (char1 == 'x' || char1 == 'X')
+            return String::charToString (static_cast <beast_wchar> (ent.substring (2).getHexValue32()));
+
+        if (char1 >= '0' && char1 <= '9')
+            return String::charToString (static_cast <beast_wchar> (ent.substring (1).getIntValue()));
+
+        setLastError ("illegal escape sequence", false);
+        return String::charToString ('&');
+    }
+
+    return expandExternalEntity (ent);
+}
+
+String XmlDocument::expandExternalEntity (const String& entity)
+{
+    if (needToLoadDTD)
+    {
+        if (dtdText.isNotEmpty())
+        {
+            dtdText = dtdText.trimCharactersAtEnd (">");
+            tokenisedDTD.addTokens (dtdText, true);
+
+            if (tokenisedDTD [tokenisedDTD.size() - 2].equalsIgnoreCase ("system")
+                 && tokenisedDTD [tokenisedDTD.size() - 1].isQuotedString())
+            {
+                const String fn (tokenisedDTD [tokenisedDTD.size() - 1]);
+
+                tokenisedDTD.clear();
+                tokenisedDTD.addTokens (getFileContents (fn), true);
+            }
+            else
+            {
+                tokenisedDTD.clear();
+                const int openBracket = dtdText.indexOfChar ('[');
+
+                if (openBracket > 0)
+                {
+                    const int closeBracket = dtdText.lastIndexOfChar (']');
+
+                    if (closeBracket > openBracket)
+                        tokenisedDTD.addTokens (dtdText.substring (openBracket + 1,
+                                                                   closeBracket), true);
+                }
+            }
+
+            for (int i = tokenisedDTD.size(); --i >= 0;)
+            {
+                if (tokenisedDTD[i].startsWithChar ('%')
+                     && tokenisedDTD[i].endsWithChar (';'))
+                {
+                    const String parsed (getParameterEntity (tokenisedDTD[i].substring (1, tokenisedDTD[i].length() - 1)));
+                    StringArray newToks;
+                    newToks.addTokens (parsed, true);
+
+                    tokenisedDTD.remove (i);
+
+                    for (int j = newToks.size(); --j >= 0;)
+                        tokenisedDTD.insert (i, newToks[j]);
+                }
+            }
+        }
+
+        needToLoadDTD = false;
+    }
+
+    for (int i = 0; i < tokenisedDTD.size(); ++i)
+    {
+        if (tokenisedDTD[i] == entity)
+        {
+            if (tokenisedDTD[i - 1].equalsIgnoreCase ("<!entity"))
+            {
+                String ent (tokenisedDTD [i + 1].trimCharactersAtEnd (">").trim().unquoted());
+
+                // check for sub-entities..
+                int ampersand = ent.indexOfChar ('&');
+
+                while (ampersand >= 0)
+                {
+                    const int semiColon = ent.indexOf (i + 1, ";");
+
+                    if (semiColon < 0)
+                    {
+                        setLastError ("entity without terminating semi-colon", false);
+                        break;
+                    }
+
+                    const String resolved (expandEntity (ent.substring (i + 1, semiColon)));
+
+                    ent = ent.substring (0, ampersand)
+                           + resolved
+                           + ent.substring (semiColon + 1);
+
+                    ampersand = ent.indexOfChar (semiColon + 1, '&');
+                }
+
+                return ent;
+            }
+        }
+    }
+
+    setLastError ("unknown entity", true);
+
+    return entity;
+}
+
+String XmlDocument::getParameterEntity (const String& entity)
+{
+    for (int i = 0; i < tokenisedDTD.size(); ++i)
+    {
+        if (tokenisedDTD[i] == entity
+             && tokenisedDTD [i - 1] == "%"
+             && tokenisedDTD [i - 2].equalsIgnoreCase ("<!entity"))
+        {
+            const String ent (tokenisedDTD [i + 1].trimCharactersAtEnd (">"));
+
+            if (ent.equalsIgnoreCase ("system"))
+                return getFileContents (tokenisedDTD [i + 2].trimCharactersAtEnd (">"));
+
+            return ent.trim().unquoted();
+        }
+    }
+
+    return entity;
+}