Source/WebCore/html/parser/HTMLConstructionSite.cpp - platform/external/chromium_org/third_party/WebKit - Git at Google

 /*
  * Copyright (C) 2010 Google, Inc. All Rights Reserved.
  * Copyright (C) 2011 Apple Inc. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY GOOGLE INC. ``AS IS'' AND ANY
  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL GOOGLE INC. OR
  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
  * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
  * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
  * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */

 #include "config.h"
 #include "HTMLTreeBuilder.h"

 #include "Comment.h"
 #include "DocumentFragment.h"
 #include "DocumentType.h"
 #include "Element.h"
 #include "Frame.h"
 #include "HTMLDocument.h"
 #include "HTMLElementFactory.h"
 #include "HTMLFormElement.h"
 #include "HTMLHtmlElement.h"
 #include "HTMLNames.h"
 #include "HTMLParserIdioms.h"
 #include "HTMLScriptElement.h"
 #include "HTMLStackItem.h"
 #include "HTMLToken.h"
 #include "HTMLTokenizer.h"
 #include "LocalizedStrings.h"
 #if ENABLE(MATHML)
 #include "MathMLNames.h"
 #endif
 #include "NotImplemented.h"
 #if ENABLE(SVG)
 #include "SVGNames.h"
 #endif
 #include "Settings.h"
 #include "Text.h"
 #include <wtf/UnusedParam.h>

 namespace WebCore {

 using namespace HTMLNames;

 static bool hasImpliedEndTag(const HTMLStackItem* item)
 {
     return item->hasTagName(ddTag)
         || item->hasTagName(dtTag)
         || item->hasTagName(liTag)
         || item->hasTagName(optionTag)
         || item->hasTagName(optgroupTag)
         || item->hasTagName(pTag)
         || item->hasTagName(rpTag)
         || item->hasTagName(rtTag);
 }

 static inline bool isAllWhitespace(const String& string)
 {
     return string.isAllSpecialCharacters<isHTMLSpace>();
 }

 static inline void executeTask(HTMLConstructionSiteTask& task)
 {
     if (task.nextChild)
         task.parent->parserInsertBefore(task.child.get(), task.nextChild.get());
     else
         task.parent->parserAppendChild(task.child.get());

     // JavaScript run from beforeload (or DOM Mutation or event handlers)
     // might have removed the child, in which case we should not attach it.

     if (task.child->parentNode() && task.parent->attached() && !task.child->attached())
         task.child->attach();

     task.child->beginParsingChildren();

     if (task.selfClosing)
         task.child->finishParsingChildren();
 }

 void HTMLConstructionSite::attachLater(ContainerNode* parent, PassRefPtr<Node> prpChild, bool selfClosing)
 {
     HTMLConstructionSiteTask task;
     task.parent = parent;
     task.child = prpChild;
     task.selfClosing = selfClosing;

     if (shouldFosterParent()) {
         fosterParent(task.child);
         return;
     }

     // Add as a sibling of the parent if we have reached the maximum depth allowed.
     if (m_openElements.stackDepth() > m_maximumDOMTreeDepth && task.parent->parentNode())
         task.parent = task.parent->parentNode();

     ASSERT(task.parent);
     m_attachmentQueue.append(task);
 }

 void HTMLConstructionSite::executeQueuedTasks()
 {
     const size_t size = m_attachmentQueue.size();
     if (!size)
         return;

     // Copy the task queue into a local variable in case executeTask
     // re-enters the parser.
     AttachmentQueue queue;
     queue.swap(m_attachmentQueue);

     for (size_t i = 0; i < size; ++i)
         executeTask(queue[i]);

     // We might be detached now.
 }

 HTMLConstructionSite::HTMLConstructionSite(Document* document, unsigned maximumDOMTreeDepth)
     : m_document(document)
     , m_attachmentRoot(document)
     , m_fragmentScriptingPermission(AllowScriptingContent)
     , m_isParsingFragment(false)
     , m_redirectAttachToFosterParent(false)
     , m_maximumDOMTreeDepth(maximumDOMTreeDepth)
 {
 }

 HTMLConstructionSite::HTMLConstructionSite(DocumentFragment* fragment, FragmentScriptingPermission scriptingPermission, unsigned maximumDOMTreeDepth)
     : m_document(fragment->document())
     , m_attachmentRoot(fragment)
     , m_fragmentScriptingPermission(scriptingPermission)
     , m_isParsingFragment(true)
     , m_redirectAttachToFosterParent(false)
     , m_maximumDOMTreeDepth(maximumDOMTreeDepth)
 {
 }

 HTMLConstructionSite::~HTMLConstructionSite()
 {
 }

 void HTMLConstructionSite::detach()
 {
     m_document = 0;
     m_attachmentRoot = 0;
 }

 void HTMLConstructionSite::setForm(HTMLFormElement* form)
 {
     // This method should only be needed for HTMLTreeBuilder in the fragment case.
     ASSERT(!m_form);
     m_form = form;
 }

 PassRefPtr<HTMLFormElement> HTMLConstructionSite::takeForm()
 {
     return m_form.release();
 }

 void HTMLConstructionSite::dispatchDocumentElementAvailableIfNeeded()
 {
     ASSERT(m_document);
     if (m_document->frame() && !m_isParsingFragment)
         m_document->frame()->loader()->dispatchDocumentElementAvailable();
 }

 void HTMLConstructionSite::insertHTMLHtmlStartTagBeforeHTML(AtomicHTMLToken* token)
 {
     RefPtr<HTMLHtmlElement> element = HTMLHtmlElement::create(m_document);
     element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
     attachLater(m_attachmentRoot, element);
     m_openElements.pushHTMLHtmlElement(HTMLStackItem::create(element, token));

     executeQueuedTasks();
     element->insertedByParser();
     dispatchDocumentElementAvailableIfNeeded();
 }

 void HTMLConstructionSite::mergeAttributesFromTokenIntoElement(AtomicHTMLToken* token, Element* element)
 {
     if (token->attributes().isEmpty())
         return;

     ElementAttributeData* elementAttributeData = element->mutableAttributeData();

     for (unsigned i = 0; i < token->attributes().size(); ++i) {
         const Attribute& tokenAttribute = token->attributes().at(i);
         if (!elementAttributeData->getAttributeItem(tokenAttribute.name()))
             element->setAttribute(tokenAttribute.name(), tokenAttribute.value());
     }
 }

 void HTMLConstructionSite::insertHTMLHtmlStartTagInBody(AtomicHTMLToken* token)
 {
     // Fragments do not have a root HTML element, so any additional HTML elements
     // encountered during fragment parsing should be ignored.
     if (m_isParsingFragment)
         return;

     mergeAttributesFromTokenIntoElement(token, m_openElements.htmlElement());
 }

 void HTMLConstructionSite::insertHTMLBodyStartTagInBody(AtomicHTMLToken* token)
 {
     mergeAttributesFromTokenIntoElement(token, m_openElements.bodyElement());
 }

 void HTMLConstructionSite::insertDoctype(AtomicHTMLToken* token)
 {
     ASSERT(token->type() == HTMLTokenTypes::DOCTYPE);

     RefPtr<DocumentType> doctype = DocumentType::create(m_document, token->name(), String::adopt(token->publicIdentifier()), String::adopt(token->systemIdentifier()));
     attachLater(m_attachmentRoot, doctype.release());

     // DOCTYPE nodes are only processed when parsing fragments w/o contextElements, which
     // never occurs.  However, if we ever chose to support such, this code is subtly wrong,
     // because context-less fragments can determine their own quirks mode, and thus change
     // parsing rules (like <p> inside <table>).  For now we ASSERT that we never hit this code
     // in a fragment, as changing the owning document's compatibility mode would be wrong.
     ASSERT(!m_isParsingFragment);
     if (m_isParsingFragment)
         return;

     if (token->forceQuirks())
         m_document->setCompatibilityMode(Document::QuirksMode);
     else {
         // We need to actually add the Doctype node to the DOM.
         executeQueuedTasks();
         m_document->setCompatibilityModeFromDoctype();
     }
 }

 void HTMLConstructionSite::insertComment(AtomicHTMLToken* token)
 {
     ASSERT(token->type() == HTMLTokenTypes::Comment);
     attachLater(currentNode(), Comment::create(currentNode()->document(), token->comment()));
 }

 void HTMLConstructionSite::insertCommentOnDocument(AtomicHTMLToken* token)
 {
     ASSERT(token->type() == HTMLTokenTypes::Comment);
     attachLater(m_attachmentRoot, Comment::create(m_document, token->comment()));
 }

 void HTMLConstructionSite::insertCommentOnHTMLHtmlElement(AtomicHTMLToken* token)
 {
     ASSERT(token->type() == HTMLTokenTypes::Comment);
     ContainerNode* parent = m_openElements.rootNode();
     attachLater(parent, Comment::create(parent->document(), token->comment()));
 }

 void HTMLConstructionSite::insertHTMLHeadElement(AtomicHTMLToken* token)
 {
     ASSERT(!shouldFosterParent());
     m_head = HTMLStackItem::create(createHTMLElement(token), token);
     attachLater(currentNode(), m_head->element());
     m_openElements.pushHTMLHeadElement(m_head);
 }

 void HTMLConstructionSite::insertHTMLBodyElement(AtomicHTMLToken* token)
 {
     ASSERT(!shouldFosterParent());
     RefPtr<Element> body = createHTMLElement(token);
     attachLater(currentNode(), body);
     m_openElements.pushHTMLBodyElement(HTMLStackItem::create(body.release(), token));
 }

 void HTMLConstructionSite::insertHTMLFormElement(AtomicHTMLToken* token, bool isDemoted)
 {
     RefPtr<Element> element = createHTMLElement(token);
     ASSERT(element->hasTagName(formTag));
     m_form = static_pointer_cast<HTMLFormElement>(element.release());
     m_form->setDemoted(isDemoted);
     attachLater(currentNode(), m_form);
     m_openElements.push(HTMLStackItem::create(m_form, token));
 }

 void HTMLConstructionSite::insertHTMLElement(AtomicHTMLToken* token)
 {
     RefPtr<Element> element = createHTMLElement(token);
     attachLater(currentNode(), element);
     m_openElements.push(HTMLStackItem::create(element.release(), token));
 }

 void HTMLConstructionSite::insertSelfClosingHTMLElement(AtomicHTMLToken* token)
 {
     ASSERT(token->type() == HTMLTokenTypes::StartTag);
     // Normally HTMLElementStack is responsible for calling finishParsingChildren,
     // but self-closing elements are never in the element stack so the stack
     // doesn't get a chance to tell them that we're done parsing their children.
     attachLater(currentNode(), createHTMLElement(token), true);
     // FIXME: Do we want to acknowledge the token's self-closing flag?
     // http://www.whatwg.org/specs/web-apps/current-work/multipage/tokenization.html#acknowledge-self-closing-flag
 }

 void HTMLConstructionSite::insertFormattingElement(AtomicHTMLToken* token)
 {
     // http://www.whatwg.org/specs/web-apps/current-work/multipage/parsing.html#the-stack-of-open-elements
     // Possible active formatting elements include:
     // a, b, big, code, em, font, i, nobr, s, small, strike, strong, tt, and u.
     insertHTMLElement(token);
     m_activeFormattingElements.append(currentElementRecord()->stackItem());
 }

 void HTMLConstructionSite::insertScriptElement(AtomicHTMLToken* token)
 {
     // http://www.whatwg.org/specs/web-apps/current-work/multipage/scripting-1.html#already-started
     // http://html5.org/specs/dom-parsing.html#dom-range-createcontextualfragment
     // For createContextualFragment, the specifications say to mark it parser-inserted and already-started and later unmark them.
     // However, we short circuit that logic to avoid the subtree traversal to find script elements since scripts can never see
     // those flags or effects thereof.
     const bool parserInserted = m_fragmentScriptingPermission != AllowScriptingContentAndDoNotMarkAlreadyStarted;
     const bool alreadyStarted = m_isParsingFragment && parserInserted;
     RefPtr<HTMLScriptElement> element = HTMLScriptElement::create(scriptTag, currentNode()->document(), parserInserted, alreadyStarted);
     if (m_fragmentScriptingPermission != DisallowScriptingContent)
         element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
     attachLater(currentNode(), element);
     m_openElements.push(HTMLStackItem::create(element.release(), token));
 }

 void HTMLConstructionSite::insertForeignElement(AtomicHTMLToken* token, const AtomicString& namespaceURI)
 {
     ASSERT(token->type() == HTMLTokenTypes::StartTag);
     notImplemented(); // parseError when xmlns or xmlns:xlink are wrong.

     RefPtr<Element> element = createElement(token, namespaceURI);
     attachLater(currentNode(), element, token->selfClosing());
     if (!token->selfClosing())
         m_openElements.push(HTMLStackItem::create(element.release(), token, namespaceURI));
 }

 void HTMLConstructionSite::insertTextNode(const String& characters, WhitespaceMode whitespaceMode)
 {
     HTMLConstructionSiteTask task;
     task.parent = currentNode();

     if (shouldFosterParent())
         findFosterSite(task);

     // Strings composed entirely of whitespace are likely to be repeated.
     // Turn them into AtomicString so we share a single string for each.
     bool shouldUseAtomicString = whitespaceMode == AllWhitespace
         || (whitespaceMode == WhitespaceUnknown && isAllWhitespace(characters));

     unsigned currentPosition = 0;

     // FIXME: Splitting text nodes into smaller chunks contradicts HTML5 spec, but is currently necessary
     // for performance, see <https://bugs.webkit.org/show_bug.cgi?id=55898>.

     Node* previousChild = task.nextChild ? task.nextChild->previousSibling() : task.parent->lastChild();
     if (previousChild && previousChild->isTextNode()) {
         // FIXME: We're only supposed to append to this text node if it
         // was the last text node inserted by the parser.
         CharacterData* textNode = static_cast<CharacterData*>(previousChild);
         currentPosition = textNode->parserAppendData(characters, 0, Text::defaultLengthLimit);
     }

     while (currentPosition < characters.length()) {
         RefPtr<Text> textNode = Text::createWithLengthLimit(task.parent->document(), shouldUseAtomicString ? AtomicString(characters).string() : characters, currentPosition);
         // If we have a whole string of unbreakable characters the above could lead to an infinite loop. Exceeding the length limit is the lesser evil.
         if (!textNode->length()) {
             String substring = characters.substring(currentPosition);
             textNode = Text::create(task.parent->document(), shouldUseAtomicString ? AtomicString(substring).string() : substring);
         }

         currentPosition += textNode->length();
         ASSERT(currentPosition <= characters.length());
         task.child = textNode.release();
         executeTask(task);
     }
 }

 PassRefPtr<Element> HTMLConstructionSite::createElement(AtomicHTMLToken* token, const AtomicString& namespaceURI)
 {
     QualifiedName tagName(nullAtom, token->name(), namespaceURI);
     RefPtr<Element> element = currentNode()->document()->createElement(tagName, true);
     element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
     return element.release();
 }

 PassRefPtr<Element> HTMLConstructionSite::createHTMLElement(AtomicHTMLToken* token)
 {
     QualifiedName tagName(nullAtom, token->name(), xhtmlNamespaceURI);
     // FIXME: This can't use HTMLConstructionSite::createElement because we
     // have to pass the current form element.  We should rework form association
     // to occur after construction to allow better code sharing here.
     RefPtr<Element> element = HTMLElementFactory::createHTMLElement(tagName, currentNode()->document(), form(), true);
     element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
     ASSERT(element->isHTMLElement());
     return element.release();
 }

 PassRefPtr<HTMLStackItem> HTMLConstructionSite::createElementFromSavedToken(HTMLStackItem* item)
 {
     RefPtr<Element> element;
     if (item->namespaceURI() == HTMLNames::xhtmlNamespaceURI)
         element = createHTMLElement(item->token());
     else
         element = createElement(item->token(), item->namespaceURI());
     return HTMLStackItem::create(element.release(), item->token(), item->namespaceURI());
 }

 bool HTMLConstructionSite::indexOfFirstUnopenFormattingElement(unsigned& firstUnopenElementIndex) const
 {
     if (m_activeFormattingElements.isEmpty())
         return false;
     unsigned index = m_activeFormattingElements.size();
     do {
         --index;
         const HTMLFormattingElementList::Entry& entry = m_activeFormattingElements.at(index);
         if (entry.isMarker() || m_openElements.contains(entry.element())) {
             firstUnopenElementIndex = index + 1;
             return firstUnopenElementIndex < m_activeFormattingElements.size();
         }
     } while (index);
     firstUnopenElementIndex = index;
     return true;
 }

 void HTMLConstructionSite::reconstructTheActiveFormattingElements()
 {
     unsigned firstUnopenElementIndex;
     if (!indexOfFirstUnopenFormattingElement(firstUnopenElementIndex))
         return;

     unsigned unopenEntryIndex = firstUnopenElementIndex;
     ASSERT(unopenEntryIndex < m_activeFormattingElements.size());
     for (; unopenEntryIndex < m_activeFormattingElements.size(); ++unopenEntryIndex) {
         HTMLFormattingElementList::Entry& unopenedEntry = m_activeFormattingElements.at(unopenEntryIndex);
         RefPtr<HTMLStackItem> reconstructed = createElementFromSavedToken(unopenedEntry.stackItem().get());
         attachLater(currentNode(), reconstructed->node());
         m_openElements.push(reconstructed);
         unopenedEntry.replaceElement(reconstructed.release());
     }
 }

 void HTMLConstructionSite::generateImpliedEndTagsWithExclusion(const AtomicString& tagName)
 {
     while (hasImpliedEndTag(currentStackItem()) && !currentStackItem()->hasLocalName(tagName))
         m_openElements.pop();
 }

 void HTMLConstructionSite::generateImpliedEndTags()
 {
     while (hasImpliedEndTag(currentStackItem()))
         m_openElements.pop();
 }

 void HTMLConstructionSite::findFosterSite(HTMLConstructionSiteTask& task)
 {
     HTMLElementStack::ElementRecord* lastTableElementRecord = m_openElements.topmost(tableTag.localName());
     if (lastTableElementRecord) {
         Element* lastTableElement = lastTableElementRecord->element();
         ContainerNode* parent = lastTableElement->parentNode();
         // When parsing HTML fragments, we skip step 4.2 ("Let root be a new html element with no attributes") for efficiency,
         // and instead use the DocumentFragment as a root node. So we must treat the root node (DocumentFragment) as if it is a html element here.
         if (parent && (parent->isElementNode() || (m_isParsingFragment && parent == m_openElements.rootNode()))) {
             task.parent = parent;
             task.nextChild = lastTableElement;
             return;
         }
         task.parent = lastTableElementRecord->next()->element();
         return;
     }
     // Fragment case
     task.parent = m_openElements.rootNode(); // DocumentFragment
 }

 bool HTMLConstructionSite::shouldFosterParent() const
 {
     return m_redirectAttachToFosterParent
         && currentStackItem()->isElementNode()
         && currentStackItem()->causesFosterParenting();
 }

 void HTMLConstructionSite::fosterParent(PassRefPtr<Node> node)
 {
     HTMLConstructionSiteTask task;
     findFosterSite(task);
     task.child = node;
     ASSERT(task.parent);
     m_attachmentQueue.append(task);
 }

 }
	/*
	* Copyright (C) 2010 Google, Inc. All Rights Reserved.
	* Copyright (C) 2011 Apple Inc. All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions
	* are met:
	* 1. Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimer in the
	* documentation and/or other materials provided with the distribution.
	*
	* THIS SOFTWARE IS PROVIDED BY GOOGLE INC. ``AS IS'' AND ANY
	* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
	* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
	* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GOOGLE INC. OR
	* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
	* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
	* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
	* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
	* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
	*/

	#include "config.h"
	#include "HTMLTreeBuilder.h"

	#include "Comment.h"
	#include "DocumentFragment.h"
	#include "DocumentType.h"
	#include "Element.h"
	#include "Frame.h"
	#include "HTMLDocument.h"
	#include "HTMLElementFactory.h"
	#include "HTMLFormElement.h"
	#include "HTMLHtmlElement.h"
	#include "HTMLNames.h"
	#include "HTMLParserIdioms.h"
	#include "HTMLScriptElement.h"
	#include "HTMLStackItem.h"
	#include "HTMLToken.h"
	#include "HTMLTokenizer.h"
	#include "LocalizedStrings.h"
	#if ENABLE(MATHML)
	#include "MathMLNames.h"
	#endif
	#include "NotImplemented.h"
	#if ENABLE(SVG)
	#include "SVGNames.h"
	#endif
	#include "Settings.h"
	#include "Text.h"
	#include <wtf/UnusedParam.h>

	namespace WebCore {

	using namespace HTMLNames;

	static bool hasImpliedEndTag(const HTMLStackItem* item)
	{
	return item->hasTagName(ddTag)
	\|\| item->hasTagName(dtTag)
	\|\| item->hasTagName(liTag)
	\|\| item->hasTagName(optionTag)
	\|\| item->hasTagName(optgroupTag)
	\|\| item->hasTagName(pTag)
	\|\| item->hasTagName(rpTag)
	\|\| item->hasTagName(rtTag);
	}

	static inline bool isAllWhitespace(const String& string)
	{
	return string.isAllSpecialCharacters<isHTMLSpace>();
	}

	static inline void executeTask(HTMLConstructionSiteTask& task)
	{
	if (task.nextChild)
	task.parent->parserInsertBefore(task.child.get(), task.nextChild.get());
	else
	task.parent->parserAppendChild(task.child.get());

	// JavaScript run from beforeload (or DOM Mutation or event handlers)
	// might have removed the child, in which case we should not attach it.

	if (task.child->parentNode() && task.parent->attached() && !task.child->attached())
	task.child->attach();

	task.child->beginParsingChildren();

	if (task.selfClosing)
	task.child->finishParsingChildren();
	}

	void HTMLConstructionSite::attachLater(ContainerNode* parent, PassRefPtr<Node> prpChild, bool selfClosing)
	{
	HTMLConstructionSiteTask task;
	task.parent = parent;
	task.child = prpChild;
	task.selfClosing = selfClosing;

	if (shouldFosterParent()) {
	fosterParent(task.child);
	return;
	}

	// Add as a sibling of the parent if we have reached the maximum depth allowed.
	if (m_openElements.stackDepth() > m_maximumDOMTreeDepth && task.parent->parentNode())
	task.parent = task.parent->parentNode();

	ASSERT(task.parent);
	m_attachmentQueue.append(task);
	}

	void HTMLConstructionSite::executeQueuedTasks()
	{
	const size_t size = m_attachmentQueue.size();
	if (!size)
	return;

	// Copy the task queue into a local variable in case executeTask
	// re-enters the parser.
	AttachmentQueue queue;
	queue.swap(m_attachmentQueue);

	for (size_t i = 0; i < size; ++i)
	executeTask(queue[i]);

	// We might be detached now.
	}

	HTMLConstructionSite::HTMLConstructionSite(Document* document, unsigned maximumDOMTreeDepth)
	: m_document(document)
	, m_attachmentRoot(document)
	, m_fragmentScriptingPermission(AllowScriptingContent)
	, m_isParsingFragment(false)
	, m_redirectAttachToFosterParent(false)
	, m_maximumDOMTreeDepth(maximumDOMTreeDepth)
	{
	}

	HTMLConstructionSite::HTMLConstructionSite(DocumentFragment* fragment, FragmentScriptingPermission scriptingPermission, unsigned maximumDOMTreeDepth)
	: m_document(fragment->document())
	, m_attachmentRoot(fragment)
	, m_fragmentScriptingPermission(scriptingPermission)
	, m_isParsingFragment(true)
	, m_redirectAttachToFosterParent(false)
	, m_maximumDOMTreeDepth(maximumDOMTreeDepth)
	{
	}

	HTMLConstructionSite::~HTMLConstructionSite()
	{
	}

	void HTMLConstructionSite::detach()
	{
	m_document = 0;
	m_attachmentRoot = 0;
	}

	void HTMLConstructionSite::setForm(HTMLFormElement* form)
	{
	// This method should only be needed for HTMLTreeBuilder in the fragment case.
	ASSERT(!m_form);
	m_form = form;
	}

	PassRefPtr<HTMLFormElement> HTMLConstructionSite::takeForm()
	{
	return m_form.release();
	}

	void HTMLConstructionSite::dispatchDocumentElementAvailableIfNeeded()
	{
	ASSERT(m_document);
	if (m_document->frame() && !m_isParsingFragment)
	m_document->frame()->loader()->dispatchDocumentElementAvailable();
	}

	void HTMLConstructionSite::insertHTMLHtmlStartTagBeforeHTML(AtomicHTMLToken* token)
	{
	RefPtr<HTMLHtmlElement> element = HTMLHtmlElement::create(m_document);
	element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
	attachLater(m_attachmentRoot, element);
	m_openElements.pushHTMLHtmlElement(HTMLStackItem::create(element, token));

	executeQueuedTasks();
	element->insertedByParser();
	dispatchDocumentElementAvailableIfNeeded();
	}

	void HTMLConstructionSite::mergeAttributesFromTokenIntoElement(AtomicHTMLToken* token, Element* element)
	{
	if (token->attributes().isEmpty())
	return;

	ElementAttributeData* elementAttributeData = element->mutableAttributeData();

	for (unsigned i = 0; i < token->attributes().size(); ++i) {
	const Attribute& tokenAttribute = token->attributes().at(i);
	if (!elementAttributeData->getAttributeItem(tokenAttribute.name()))
	element->setAttribute(tokenAttribute.name(), tokenAttribute.value());
	}
	}

	void HTMLConstructionSite::insertHTMLHtmlStartTagInBody(AtomicHTMLToken* token)
	{
	// Fragments do not have a root HTML element, so any additional HTML elements
	// encountered during fragment parsing should be ignored.
	if (m_isParsingFragment)
	return;

	mergeAttributesFromTokenIntoElement(token, m_openElements.htmlElement());
	}

	void HTMLConstructionSite::insertHTMLBodyStartTagInBody(AtomicHTMLToken* token)
	{
	mergeAttributesFromTokenIntoElement(token, m_openElements.bodyElement());
	}

	void HTMLConstructionSite::insertDoctype(AtomicHTMLToken* token)
	{
	ASSERT(token->type() == HTMLTokenTypes::DOCTYPE);

	RefPtr<DocumentType> doctype = DocumentType::create(m_document, token->name(), String::adopt(token->publicIdentifier()), String::adopt(token->systemIdentifier()));
	attachLater(m_attachmentRoot, doctype.release());

	// DOCTYPE nodes are only processed when parsing fragments w/o contextElements, which
	// never occurs. However, if we ever chose to support such, this code is subtly wrong,
	// because context-less fragments can determine their own quirks mode, and thus change
	// parsing rules (like <p> inside <table>). For now we ASSERT that we never hit this code
	// in a fragment, as changing the owning document's compatibility mode would be wrong.
	ASSERT(!m_isParsingFragment);
	if (m_isParsingFragment)
	return;

	if (token->forceQuirks())
	m_document->setCompatibilityMode(Document::QuirksMode);
	else {
	// We need to actually add the Doctype node to the DOM.
	executeQueuedTasks();
	m_document->setCompatibilityModeFromDoctype();
	}
	}

	void HTMLConstructionSite::insertComment(AtomicHTMLToken* token)
	{
	ASSERT(token->type() == HTMLTokenTypes::Comment);
	attachLater(currentNode(), Comment::create(currentNode()->document(), token->comment()));
	}

	void HTMLConstructionSite::insertCommentOnDocument(AtomicHTMLToken* token)
	{
	ASSERT(token->type() == HTMLTokenTypes::Comment);
	attachLater(m_attachmentRoot, Comment::create(m_document, token->comment()));
	}

	void HTMLConstructionSite::insertCommentOnHTMLHtmlElement(AtomicHTMLToken* token)
	{
	ASSERT(token->type() == HTMLTokenTypes::Comment);
	ContainerNode* parent = m_openElements.rootNode();
	attachLater(parent, Comment::create(parent->document(), token->comment()));
	}

	void HTMLConstructionSite::insertHTMLHeadElement(AtomicHTMLToken* token)
	{
	ASSERT(!shouldFosterParent());
	m_head = HTMLStackItem::create(createHTMLElement(token), token);
	attachLater(currentNode(), m_head->element());
	m_openElements.pushHTMLHeadElement(m_head);
	}

	void HTMLConstructionSite::insertHTMLBodyElement(AtomicHTMLToken* token)
	{
	ASSERT(!shouldFosterParent());
	RefPtr<Element> body = createHTMLElement(token);
	attachLater(currentNode(), body);
	m_openElements.pushHTMLBodyElement(HTMLStackItem::create(body.release(), token));
	}

	void HTMLConstructionSite::insertHTMLFormElement(AtomicHTMLToken* token, bool isDemoted)
	{
	RefPtr<Element> element = createHTMLElement(token);
	ASSERT(element->hasTagName(formTag));
	m_form = static_pointer_cast<HTMLFormElement>(element.release());
	m_form->setDemoted(isDemoted);
	attachLater(currentNode(), m_form);
	m_openElements.push(HTMLStackItem::create(m_form, token));
	}

	void HTMLConstructionSite::insertHTMLElement(AtomicHTMLToken* token)
	{
	RefPtr<Element> element = createHTMLElement(token);
	attachLater(currentNode(), element);
	m_openElements.push(HTMLStackItem::create(element.release(), token));
	}

	void HTMLConstructionSite::insertSelfClosingHTMLElement(AtomicHTMLToken* token)
	{
	ASSERT(token->type() == HTMLTokenTypes::StartTag);
	// Normally HTMLElementStack is responsible for calling finishParsingChildren,
	// but self-closing elements are never in the element stack so the stack
	// doesn't get a chance to tell them that we're done parsing their children.
	attachLater(currentNode(), createHTMLElement(token), true);
	// FIXME: Do we want to acknowledge the token's self-closing flag?
	// http://www.whatwg.org/specs/web-apps/current-work/multipage/tokenization.html#acknowledge-self-closing-flag
	}

	void HTMLConstructionSite::insertFormattingElement(AtomicHTMLToken* token)
	{
	// http://www.whatwg.org/specs/web-apps/current-work/multipage/parsing.html#the-stack-of-open-elements
	// Possible active formatting elements include:
	// a, b, big, code, em, font, i, nobr, s, small, strike, strong, tt, and u.
	insertHTMLElement(token);
	m_activeFormattingElements.append(currentElementRecord()->stackItem());
	}

	void HTMLConstructionSite::insertScriptElement(AtomicHTMLToken* token)
	{
	// http://www.whatwg.org/specs/web-apps/current-work/multipage/scripting-1.html#already-started
	// http://html5.org/specs/dom-parsing.html#dom-range-createcontextualfragment
	// For createContextualFragment, the specifications say to mark it parser-inserted and already-started and later unmark them.
	// However, we short circuit that logic to avoid the subtree traversal to find script elements since scripts can never see
	// those flags or effects thereof.
	const bool parserInserted = m_fragmentScriptingPermission != AllowScriptingContentAndDoNotMarkAlreadyStarted;
	const bool alreadyStarted = m_isParsingFragment && parserInserted;
	RefPtr<HTMLScriptElement> element = HTMLScriptElement::create(scriptTag, currentNode()->document(), parserInserted, alreadyStarted);
	if (m_fragmentScriptingPermission != DisallowScriptingContent)
	element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
	attachLater(currentNode(), element);
	m_openElements.push(HTMLStackItem::create(element.release(), token));
	}

	void HTMLConstructionSite::insertForeignElement(AtomicHTMLToken* token, const AtomicString& namespaceURI)
	{
	ASSERT(token->type() == HTMLTokenTypes::StartTag);
	notImplemented(); // parseError when xmlns or xmlns:xlink are wrong.

	RefPtr<Element> element = createElement(token, namespaceURI);
	attachLater(currentNode(), element, token->selfClosing());
	if (!token->selfClosing())
	m_openElements.push(HTMLStackItem::create(element.release(), token, namespaceURI));
	}

	void HTMLConstructionSite::insertTextNode(const String& characters, WhitespaceMode whitespaceMode)
	{
	HTMLConstructionSiteTask task;
	task.parent = currentNode();

	if (shouldFosterParent())
	findFosterSite(task);

	// Strings composed entirely of whitespace are likely to be repeated.
	// Turn them into AtomicString so we share a single string for each.
	bool shouldUseAtomicString = whitespaceMode == AllWhitespace
	\|\| (whitespaceMode == WhitespaceUnknown && isAllWhitespace(characters));

	unsigned currentPosition = 0;

	// FIXME: Splitting text nodes into smaller chunks contradicts HTML5 spec, but is currently necessary
	// for performance, see <https://bugs.webkit.org/show_bug.cgi?id=55898>.

	Node* previousChild = task.nextChild ? task.nextChild->previousSibling() : task.parent->lastChild();
	if (previousChild && previousChild->isTextNode()) {
	// FIXME: We're only supposed to append to this text node if it
	// was the last text node inserted by the parser.
	CharacterData* textNode = static_cast<CharacterData*>(previousChild);
	currentPosition = textNode->parserAppendData(characters, 0, Text::defaultLengthLimit);
	}

	while (currentPosition < characters.length()) {
	RefPtr<Text> textNode = Text::createWithLengthLimit(task.parent->document(), shouldUseAtomicString ? AtomicString(characters).string() : characters, currentPosition);
	// If we have a whole string of unbreakable characters the above could lead to an infinite loop. Exceeding the length limit is the lesser evil.
	if (!textNode->length()) {
	String substring = characters.substring(currentPosition);
	textNode = Text::create(task.parent->document(), shouldUseAtomicString ? AtomicString(substring).string() : substring);
	}

	currentPosition += textNode->length();
	ASSERT(currentPosition <= characters.length());
	task.child = textNode.release();
	executeTask(task);
	}
	}

	PassRefPtr<Element> HTMLConstructionSite::createElement(AtomicHTMLToken* token, const AtomicString& namespaceURI)
	{
	QualifiedName tagName(nullAtom, token->name(), namespaceURI);
	RefPtr<Element> element = currentNode()->document()->createElement(tagName, true);
	element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
	return element.release();
	}

	PassRefPtr<Element> HTMLConstructionSite::createHTMLElement(AtomicHTMLToken* token)
	{
	QualifiedName tagName(nullAtom, token->name(), xhtmlNamespaceURI);
	// FIXME: This can't use HTMLConstructionSite::createElement because we
	// have to pass the current form element. We should rework form association
	// to occur after construction to allow better code sharing here.
	RefPtr<Element> element = HTMLElementFactory::createHTMLElement(tagName, currentNode()->document(), form(), true);
	element->parserSetAttributes(token->attributes(), m_fragmentScriptingPermission);
	ASSERT(element->isHTMLElement());
	return element.release();
	}

	PassRefPtr<HTMLStackItem> HTMLConstructionSite::createElementFromSavedToken(HTMLStackItem* item)
	{
	RefPtr<Element> element;
	if (item->namespaceURI() == HTMLNames::xhtmlNamespaceURI)
	element = createHTMLElement(item->token());
	else
	element = createElement(item->token(), item->namespaceURI());
	return HTMLStackItem::create(element.release(), item->token(), item->namespaceURI());
	}

	bool HTMLConstructionSite::indexOfFirstUnopenFormattingElement(unsigned& firstUnopenElementIndex) const
	{
	if (m_activeFormattingElements.isEmpty())
	return false;
	unsigned index = m_activeFormattingElements.size();
	do {
	--index;
	const HTMLFormattingElementList::Entry& entry = m_activeFormattingElements.at(index);
	if (entry.isMarker() \|\| m_openElements.contains(entry.element())) {
	firstUnopenElementIndex = index + 1;
	return firstUnopenElementIndex < m_activeFormattingElements.size();
	}
	} while (index);
	firstUnopenElementIndex = index;
	return true;
	}

	void HTMLConstructionSite::reconstructTheActiveFormattingElements()
	{
	unsigned firstUnopenElementIndex;
	if (!indexOfFirstUnopenFormattingElement(firstUnopenElementIndex))
	return;

	unsigned unopenEntryIndex = firstUnopenElementIndex;
	ASSERT(unopenEntryIndex < m_activeFormattingElements.size());
	for (; unopenEntryIndex < m_activeFormattingElements.size(); ++unopenEntryIndex) {
	HTMLFormattingElementList::Entry& unopenedEntry = m_activeFormattingElements.at(unopenEntryIndex);
	RefPtr<HTMLStackItem> reconstructed = createElementFromSavedToken(unopenedEntry.stackItem().get());
	attachLater(currentNode(), reconstructed->node());
	m_openElements.push(reconstructed);
	unopenedEntry.replaceElement(reconstructed.release());
	}
	}

	void HTMLConstructionSite::generateImpliedEndTagsWithExclusion(const AtomicString& tagName)
	{
	while (hasImpliedEndTag(currentStackItem()) && !currentStackItem()->hasLocalName(tagName))
	m_openElements.pop();
	}

	void HTMLConstructionSite::generateImpliedEndTags()
	{
	while (hasImpliedEndTag(currentStackItem()))
	m_openElements.pop();
	}

	void HTMLConstructionSite::findFosterSite(HTMLConstructionSiteTask& task)
	{
	HTMLElementStack::ElementRecord* lastTableElementRecord = m_openElements.topmost(tableTag.localName());
	if (lastTableElementRecord) {
	Element* lastTableElement = lastTableElementRecord->element();
	ContainerNode* parent = lastTableElement->parentNode();
	// When parsing HTML fragments, we skip step 4.2 ("Let root be a new html element with no attributes") for efficiency,
	// and instead use the DocumentFragment as a root node. So we must treat the root node (DocumentFragment) as if it is a html element here.
	if (parent && (parent->isElementNode() \|\| (m_isParsingFragment && parent == m_openElements.rootNode()))) {
	task.parent = parent;
	task.nextChild = lastTableElement;
	return;
	}
	task.parent = lastTableElementRecord->next()->element();
	return;
	}
	// Fragment case
	task.parent = m_openElements.rootNode(); // DocumentFragment
	}

	bool HTMLConstructionSite::shouldFosterParent() const
	{
	return m_redirectAttachToFosterParent
	&& currentStackItem()->isElementNode()
	&& currentStackItem()->causesFosterParenting();
	}

	void HTMLConstructionSite::fosterParent(PassRefPtr<Node> node)
	{
	HTMLConstructionSiteTask task;
	findFosterSite(task);
	task.child = node;
	ASSERT(task.parent);
	m_attachmentQueue.append(task);
	}

	}