| /* |
| * Copyright (C) 2000 Peter Kelly (pmk@post.com) |
| * Copyright (C) 2005, 2006, 2008 Apple Inc. All rights reserved. |
| * Copyright (C) 2006 Alexey Proskuryakov (ap@webkit.org) |
| * Copyright (C) 2007 Samuel Weinig (sam@webkit.org) |
| * Copyright (C) 2008 Nokia Corporation and/or its subsidiary(-ies) |
| * Copyright (C) 2008 Holger Hans Peter Freyther |
| * Copyright (C) 2008 Torch Mobile Inc. All rights reserved. (http://www.torchmobile.com/) |
| * |
| * This library is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Library General Public |
| * License as published by the Free Software Foundation; either |
| * version 2 of the License, or (at your option) any later version. |
| * |
| * This library is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Library General Public License for more details. |
| * |
| * You should have received a copy of the GNU Library General Public License |
| * along with this library; see the file COPYING.LIB. If not, write to |
| * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, |
| * Boston, MA 02110-1301, USA. |
| */ |
| |
| #include "config.h" |
| #include "XMLDocumentParser.h" |
| |
| #include "CDATASection.h" |
| #include "CachedScript.h" |
| #include "Comment.h" |
| #include "CachedResourceLoader.h" |
| #include "Document.h" |
| #include "DocumentFragment.h" |
| #include "DocumentType.h" |
| #include "Frame.h" |
| #include "FrameLoader.h" |
| #include "FrameView.h" |
| #include "HTMLLinkElement.h" |
| #include "HTMLNames.h" |
| #include "HTMLStyleElement.h" |
| #include "ImageLoader.h" |
| #include "ProcessingInstruction.h" |
| #include "ResourceError.h" |
| #include "ResourceHandle.h" |
| #include "ResourceRequest.h" |
| #include "ResourceResponse.h" |
| #include "ScriptController.h" |
| #include "ScriptElement.h" |
| #include "ScriptSourceCode.h" |
| #include "ScriptValue.h" |
| #include "TextResourceDecoder.h" |
| #include "TreeDepthLimit.h" |
| #include <wtf/text/StringConcatenate.h> |
| #include <wtf/StringExtras.h> |
| #include <wtf/Threading.h> |
| #include <wtf/Vector.h> |
| |
| #if ENABLE(SVG) |
| #include "SVGNames.h" |
| #include "SVGStyleElement.h" |
| #endif |
| |
| using namespace std; |
| |
| namespace WebCore { |
| |
| using namespace HTMLNames; |
| |
// Cap on the number of diagnostics handleError() records for non-fatal
// problems; fatal errors are recorded regardless of this limit.
static const int maxErrors = 25;
| |
| #if ENABLE(WML) |
| bool XMLDocumentParser::isWMLDocument() const |
| { |
| return document()->isWMLDocument(); |
| } |
| #endif |
| |
| void XMLDocumentParser::pushCurrentNode(Node* n) |
| { |
| ASSERT(n); |
| ASSERT(m_currentNode); |
| if (n != document()) |
| n->ref(); |
| m_currentNodeStack.append(m_currentNode); |
| m_currentNode = n; |
| if (m_currentNodeStack.size() > maxDOMTreeDepth) |
| handleError(fatal, "Excessive node nesting.", lineNumber(), columnNumber()); |
| } |
| |
| void XMLDocumentParser::popCurrentNode() |
| { |
| if (!m_currentNode) |
| return; |
| ASSERT(m_currentNodeStack.size()); |
| |
| if (m_currentNode != document()) |
| m_currentNode->deref(); |
| |
| m_currentNode = m_currentNodeStack.last(); |
| m_currentNodeStack.removeLast(); |
| } |
| |
| void XMLDocumentParser::clearCurrentNodeStack() |
| { |
| if (m_currentNode && m_currentNode != document()) |
| m_currentNode->deref(); |
| m_currentNode = 0; |
| |
| if (m_currentNodeStack.size()) { // Aborted parsing. |
| for (size_t i = m_currentNodeStack.size() - 1; i != 0; --i) |
| m_currentNodeStack[i]->deref(); |
| if (m_currentNodeStack[0] && m_currentNodeStack[0] != document()) |
| m_currentNodeStack[0]->deref(); |
| m_currentNodeStack.clear(); |
| } |
| } |
| |
| void XMLDocumentParser::insert(const SegmentedString&) |
| { |
| ASSERT_NOT_REACHED(); |
| } |
| |
| void XMLDocumentParser::append(const SegmentedString& s) |
| { |
| String parseString = s.toString(); |
| |
| if (m_sawXSLTransform || !m_sawFirstElement) |
| m_originalSourceForTransform += parseString; |
| |
| if (isStopped() || m_sawXSLTransform) |
| return; |
| |
| if (m_parserPaused) { |
| m_pendingSrc.append(s); |
| return; |
| } |
| |
| doWrite(s.toString()); |
| |
| // After parsing, go ahead and dispatch image beforeload events. |
| ImageLoader::dispatchPendingBeforeLoadEvents(); |
| } |
| |
| void XMLDocumentParser::handleError(ErrorType type, const char* m, int lineNumber, int columnNumber) |
| { |
| handleError(type, m, TextPosition1(WTF::OneBasedNumber::fromOneBasedInt(lineNumber), WTF::OneBasedNumber::fromOneBasedInt(columnNumber))); |
| } |
| |
| void XMLDocumentParser::handleError(ErrorType type, const char* m, TextPosition1 position) |
| { |
| if (type == fatal || (m_errorCount < maxErrors && m_lastErrorPosition.m_line != position.m_line && m_lastErrorPosition.m_column != position.m_column)) { |
| switch (type) { |
| case warning: |
| m_errorMessages += makeString("warning on line ", String::number(position.m_line.oneBasedInt()), " at column ", String::number(position.m_column.oneBasedInt()), ": ", m); |
| break; |
| case fatal: |
| case nonFatal: |
| m_errorMessages += makeString("error on line ", String::number(position.m_line.oneBasedInt()), " at column ", String::number(position.m_column.oneBasedInt()), ": ", m); |
| } |
| |
| m_lastErrorPosition = position; |
| ++m_errorCount; |
| } |
| |
| if (type != warning) |
| m_sawError = true; |
| |
| if (type == fatal) |
| stopParsing(); |
| } |
| |
| void XMLDocumentParser::enterText() |
| { |
| #if !USE(QXMLSTREAM) |
| ASSERT(m_bufferedText.size() == 0); |
| #endif |
| RefPtr<Node> newNode = Text::create(document(), ""); |
| m_currentNode->deprecatedParserAddChild(newNode.get()); |
| pushCurrentNode(newNode.get()); |
| } |
| |
| #if !USE(QXMLSTREAM) |
| static inline String toString(const xmlChar* string, size_t size) |
| { |
| return String::fromUTF8(reinterpret_cast<const char*>(string), size); |
| } |
| #endif |
| |
| |
| void XMLDocumentParser::exitText() |
| { |
| if (isStopped()) |
| return; |
| |
| if (!m_currentNode || !m_currentNode->isTextNode()) |
| return; |
| |
| #if !USE(QXMLSTREAM) |
| ExceptionCode ec = 0; |
| static_cast<Text*>(m_currentNode)->appendData(toString(m_bufferedText.data(), m_bufferedText.size()), ec); |
| Vector<xmlChar> empty; |
| m_bufferedText.swap(empty); |
| #endif |
| |
| if (m_view && m_currentNode && !m_currentNode->attached()) |
| m_currentNode->attach(); |
| |
| popCurrentNode(); |
| } |
| |
| void XMLDocumentParser::detach() |
| { |
| clearCurrentNodeStack(); |
| ScriptableDocumentParser::detach(); |
| } |
| |
| void XMLDocumentParser::end() |
| { |
| // XMLDocumentParserLibxml2 will do bad things to the document if doEnd() is called. |
| // I don't believe XMLDocumentParserQt needs doEnd called in the fragment case. |
| ASSERT(!m_parsingFragment); |
| |
| doEnd(); |
| |
| // doEnd() could process a script tag, thus pausing parsing. |
| if (m_parserPaused) |
| return; |
| |
| if (m_sawError) |
| insertErrorMessageBlock(); |
| else { |
| exitText(); |
| document()->styleSelectorChanged(RecalcStyleImmediately); |
| } |
| |
| if (isParsing()) |
| prepareToStopParsing(); |
| document()->setReadyState(Document::Interactive); |
| clearCurrentNodeStack(); |
| document()->finishedParsing(); |
| } |
| |
| void XMLDocumentParser::finish() |
| { |
| // FIXME: We should ASSERT(!m_parserStopped) here, since it does not |
| // makes sense to call any methods on DocumentParser once it's been stopped. |
| // However, FrameLoader::stop calls Document::finishParsing unconditionally |
| // which in turn calls m_parser->finish(). |
| |
| if (m_parserPaused) |
| m_finishCalled = true; |
| else |
| end(); |
| } |
| |
| bool XMLDocumentParser::finishWasCalled() |
| { |
| return m_finishCalled; |
| } |
| |
| static inline RefPtr<Element> createXHTMLParserErrorHeader(Document* doc, const String& errorMessages) |
| { |
| RefPtr<Element> reportElement = doc->createElement(QualifiedName(nullAtom, "parsererror", xhtmlNamespaceURI), false); |
| reportElement->setAttribute(styleAttr, "display: block; white-space: pre; border: 2px solid #c77; padding: 0 1em 0 1em; margin: 1em; background-color: #fdd; color: black"); |
| |
| ExceptionCode ec = 0; |
| RefPtr<Element> h3 = doc->createElement(h3Tag, false); |
| reportElement->appendChild(h3.get(), ec); |
| h3->appendChild(doc->createTextNode("This page contains the following errors:"), ec); |
| |
| RefPtr<Element> fixed = doc->createElement(divTag, false); |
| reportElement->appendChild(fixed.get(), ec); |
| fixed->setAttribute(styleAttr, "font-family:monospace;font-size:12px"); |
| fixed->appendChild(doc->createTextNode(errorMessages), ec); |
| |
| h3 = doc->createElement(h3Tag, false); |
| reportElement->appendChild(h3.get(), ec); |
| h3->appendChild(doc->createTextNode("Below is a rendering of the page up to the first error."), ec); |
| |
| return reportElement; |
| } |
| |
| void XMLDocumentParser::insertErrorMessageBlock() |
| { |
| #if USE(QXMLSTREAM) |
| if (m_parsingFragment) |
| return; |
| #endif |
| // One or more errors occurred during parsing of the code. Display an error block to the user above |
| // the normal content (the DOM tree is created manually and includes line/col info regarding |
| // where the errors are located) |
| |
| // Create elements for display |
| ExceptionCode ec = 0; |
| Document* document = this->document(); |
| RefPtr<Element> documentElement = document->documentElement(); |
| if (!documentElement) { |
| RefPtr<Element> rootElement = document->createElement(htmlTag, false); |
| document->appendChild(rootElement, ec); |
| RefPtr<Element> body = document->createElement(bodyTag, false); |
| rootElement->appendChild(body, ec); |
| documentElement = body.get(); |
| } |
| #if ENABLE(SVG) |
| else if (documentElement->namespaceURI() == SVGNames::svgNamespaceURI) { |
| RefPtr<Element> rootElement = document->createElement(htmlTag, false); |
| RefPtr<Element> body = document->createElement(bodyTag, false); |
| rootElement->appendChild(body, ec); |
| body->appendChild(documentElement, ec); |
| document->appendChild(rootElement.get(), ec); |
| documentElement = body.get(); |
| } |
| #endif |
| #if ENABLE(WML) |
| else if (isWMLDocument()) { |
| RefPtr<Element> rootElement = document->createElement(htmlTag, false); |
| RefPtr<Element> body = document->createElement(bodyTag, false); |
| rootElement->appendChild(body, ec); |
| body->appendChild(documentElement, ec); |
| document->appendChild(rootElement.get(), ec); |
| documentElement = body.get(); |
| } |
| #endif |
| |
| RefPtr<Element> reportElement = createXHTMLParserErrorHeader(document, m_errorMessages); |
| documentElement->insertBefore(reportElement, documentElement->firstChild(), ec); |
| #if ENABLE(XSLT) |
| if (document->transformSourceDocument()) { |
| RefPtr<Element> paragraph = document->createElement(pTag, false); |
| paragraph->setAttribute(styleAttr, "white-space: normal"); |
| paragraph->appendChild(document->createTextNode("This document was created as the result of an XSL transformation. The line and column numbers given are from the transformed result."), ec); |
| reportElement->appendChild(paragraph.release(), ec); |
| } |
| #endif |
| document->updateStyleIfNeeded(); |
| } |
| |
| void XMLDocumentParser::notifyFinished(CachedResource* unusedResource) |
| { |
| ASSERT_UNUSED(unusedResource, unusedResource == m_pendingScript); |
| ASSERT(m_pendingScript->accessCount() > 0); |
| |
| ScriptSourceCode sourceCode(m_pendingScript.get()); |
| bool errorOccurred = m_pendingScript->errorOccurred(); |
| |
| m_pendingScript->removeClient(this); |
| m_pendingScript = 0; |
| |
| RefPtr<Element> e = m_scriptElement; |
| m_scriptElement = 0; |
| |
| ScriptElement* scriptElement = toScriptElement(e.get()); |
| ASSERT(scriptElement); |
| |
| // JavaScript can detach this parser, make sure it's kept alive even if detached. |
| RefPtr<XMLDocumentParser> protect(this); |
| |
| if (errorOccurred) |
| scriptElement->dispatchErrorEvent(); |
| else { |
| scriptElement->executeScript(sourceCode); |
| scriptElement->dispatchLoadEvent(); |
| } |
| |
| m_scriptElement = 0; |
| |
| if (!isDetached() && !m_requestingScript) |
| resumeParsing(); |
| } |
| |
| bool XMLDocumentParser::isWaitingForScripts() const |
| { |
| return m_pendingScript; |
| } |
| |
| void XMLDocumentParser::pauseParsing() |
| { |
| if (m_parsingFragment) |
| return; |
| |
| m_parserPaused = true; |
| } |
| |
| bool XMLDocumentParser::parseDocumentFragment(const String& chunk, DocumentFragment* fragment, Element* contextElement, FragmentScriptingPermission scriptingPermission) |
| { |
| if (!chunk.length()) |
| return true; |
| |
| // FIXME: We need to implement the HTML5 XML Fragment parsing algorithm: |
| // http://www.whatwg.org/specs/web-apps/current-work/multipage/the-xhtml-syntax.html#xml-fragment-parsing-algorithm |
| // For now we have a hack for script/style innerHTML support: |
| if (contextElement && (contextElement->hasLocalName(HTMLNames::scriptTag) || contextElement->hasLocalName(HTMLNames::styleTag))) { |
| fragment->parserAddChild(fragment->document()->createTextNode(chunk)); |
| return true; |
| } |
| |
| RefPtr<XMLDocumentParser> parser = XMLDocumentParser::create(fragment, contextElement, scriptingPermission); |
| bool wellFormed = parser->appendFragmentSource(chunk); |
| // Do not call finish(). Current finish() and doEnd() implementations touch the main Document/loader |
| // and can cause crashes in the fragment case. |
| parser->detach(); // Allows ~DocumentParser to assert it was detached before destruction. |
| return wellFormed; // appendFragmentSource()'s wellFormed is more permissive than wellFormed(). |
| } |
| |
| } // namespace WebCore |