Source/WebCore/editing/MarkupAccumulator.cpp - platform/external/chromium_org/third_party/WebKit - Git at Google

 /*
  * Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2012 Apple Inc. All rights reserved.
  * Copyright (C) 2009, 2010 Google Inc. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions
  * are met:
  * 1. Redistributions of source code must retain the above copyright
  *    notice, this list of conditions and the following disclaimer.
  * 2. Redistributions in binary form must reproduce the above copyright
  *    notice, this list of conditions and the following disclaimer in the
  *    documentation and/or other materials provided with the distribution.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */

 #include "config.h"
 #include "MarkupAccumulator.h"

 #include "CDATASection.h"
 #include "Comment.h"
 #include "DocumentFragment.h"
 #include "DocumentType.h"
 #include "Editor.h"
 #include "HTMLElement.h"
 #include "HTMLNames.h"
 #include "HTMLTemplateElement.h"
 #include "KURL.h"
 #include "ProcessingInstruction.h"
 #include "XLinkNames.h"
 #include "XMLNSNames.h"
 #include "XMLNames.h"
 #include <wtf/unicode/CharacterNames.h>

 namespace WebCore {

 using namespace HTMLNames;

 void MarkupAccumulator::appendCharactersReplacingEntities(StringBuilder& result, const String& source, unsigned offset, unsigned length, EntityMask entityMask)
 {
     DEFINE_STATIC_LOCAL(const String, ampReference, (ASCIILiteral("&amp;")));
     DEFINE_STATIC_LOCAL(const String, ltReference, (ASCIILiteral("&lt;")));
     DEFINE_STATIC_LOCAL(const String, gtReference, (ASCIILiteral("&gt;")));
     DEFINE_STATIC_LOCAL(const String, quotReference, (ASCIILiteral("&quot;")));
     DEFINE_STATIC_LOCAL(const String, nbspReference, (ASCIILiteral("&nbsp;")));

     static const EntityDescription entityMaps[] = {
         { '&', ampReference, EntityAmp },
         { '<', ltReference, EntityLt },
         { '>', gtReference, EntityGt },
         { '"', quotReference, EntityQuot },
         { noBreakSpace, nbspReference, EntityNbsp },
     };

     if (!(offset + length))
         return;

     ASSERT(offset + length <= source.length());

     if (source.is8Bit()) {
         const LChar* text = source.characters8() + offset;

         size_t positionAfterLastEntity = 0;
         for (size_t i = 0; i < length; ++i) {
             for (size_t entityIndex = 0; entityIndex < WTF_ARRAY_LENGTH(entityMaps); ++entityIndex) {
                 if (text[i] == entityMaps[entityIndex].entity && entityMaps[entityIndex].mask & entityMask) {
                     result.append(text + positionAfterLastEntity, i - positionAfterLastEntity);
                     result.append(entityMaps[entityIndex].reference);
                     positionAfterLastEntity = i + 1;
                     break;
                 }
             }
         }
         result.append(text + positionAfterLastEntity, length - positionAfterLastEntity);
     } else {
         const UChar* text = source.characters16() + offset;

         size_t positionAfterLastEntity = 0;
         for (size_t i = 0; i < length; ++i) {
             for (size_t entityIndex = 0; entityIndex < WTF_ARRAY_LENGTH(entityMaps); ++entityIndex) {
                 if (text[i] == entityMaps[entityIndex].entity && entityMaps[entityIndex].mask & entityMask) {
                     result.append(text + positionAfterLastEntity, i - positionAfterLastEntity);
                     result.append(entityMaps[entityIndex].reference);
                     positionAfterLastEntity = i + 1;
                     break;
                 }
             }
         }
         result.append(text + positionAfterLastEntity, length - positionAfterLastEntity);
     }
 }

 MarkupAccumulator::MarkupAccumulator(Vector<Node*>* nodes, EAbsoluteURLs resolveUrlsMethod, const Range* range)
     : m_nodes(nodes)
     , m_range(range)
     , m_resolveURLsMethod(resolveUrlsMethod)
 {
 }

 MarkupAccumulator::~MarkupAccumulator()
 {
 }

 String MarkupAccumulator::serializeNodes(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly)
 {
     return serializeNodes(targetNode, nodeToSkip, childrenOnly, 0);
 }

 String MarkupAccumulator::serializeNodes(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly, Vector<QualifiedName>* tagNamesToSkip)
 {
     serializeNodesWithNamespaces(targetNode, nodeToSkip, childrenOnly, 0, tagNamesToSkip);
     return m_markup.toString();
 }

 void MarkupAccumulator::serializeNodesWithNamespaces(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly, const Namespaces* namespaces, Vector<QualifiedName>* tagNamesToSkip)
 {
     if (targetNode == nodeToSkip)
         return;

     if (tagNamesToSkip) {
         for (size_t i = 0; i < tagNamesToSkip->size(); ++i) {
             if (targetNode->hasTagName(tagNamesToSkip->at(i)))
                 return;
         }
     }

     Namespaces namespaceHash;
     if (namespaces)
         namespaceHash = *namespaces;

     if (!childrenOnly)
         appendStartTag(targetNode, &namespaceHash);

     if (!(targetNode->document()->isHTMLDocument() && elementCannotHaveEndTag(targetNode))) {
 #if ENABLE(TEMPLATE_ELEMENT)
         Node* current = targetNode->hasTagName(templateTag) ? toHTMLTemplateElement(targetNode)->content()->firstChild() : targetNode->firstChild();
 #else
         Node* current = targetNode->firstChild();
 #endif
         for ( ; current; current = current->nextSibling())
             serializeNodesWithNamespaces(current, nodeToSkip, IncludeNode, &namespaceHash, tagNamesToSkip);
     }

     if (!childrenOnly)
         appendEndTag(targetNode);
 }

 String MarkupAccumulator::resolveURLIfNeeded(const Element* element, const String& urlString) const
 {
     switch (m_resolveURLsMethod) {
     case ResolveAllURLs:
         return element->document()->completeURL(urlString).string();

     case ResolveNonLocalURLs:
         if (!element->document()->url().isLocalFile())
             return element->document()->completeURL(urlString).string();
         break;

     case DoNotResolveURLs:
         break;
     }
     return urlString;
 }

 void MarkupAccumulator::appendString(const String& string)
 {
     m_markup.append(string);
 }

 void MarkupAccumulator::appendStartTag(Node* node, Namespaces* namespaces)
 {
     appendStartMarkup(m_markup, node, namespaces);
     if (m_nodes)
         m_nodes->append(node);
 }

 void MarkupAccumulator::appendEndTag(Node* node)
 {
     appendEndMarkup(m_markup, node);
 }

 size_t MarkupAccumulator::totalLength(const Vector<String>& strings)
 {
     size_t length = 0;
     for (size_t i = 0; i < strings.size(); ++i)
         length += strings[i].length();
     return length;
 }

 void MarkupAccumulator::concatenateMarkup(StringBuilder& result)
 {
     result.append(m_markup);
 }

 void MarkupAccumulator::appendAttributeValue(StringBuilder& result, const String& attribute, bool documentIsHTML)
 {
     appendCharactersReplacingEntities(result, attribute, 0, attribute.length(),
         documentIsHTML ? EntityMaskInHTMLAttributeValue : EntityMaskInAttributeValue);
 }

 void MarkupAccumulator::appendCustomAttributes(StringBuilder&, Element*, Namespaces*)
 {
 }

 void MarkupAccumulator::appendQuotedURLAttributeValue(StringBuilder& result, const Element* element, const Attribute& attribute)
 {
     ASSERT(element->isURLAttribute(attribute));
     const String resolvedURLString = resolveURLIfNeeded(element, attribute.value());
     UChar quoteChar = '"';
     String strippedURLString = resolvedURLString.stripWhiteSpace();
     if (protocolIsJavaScript(strippedURLString)) {
         // minimal escaping for javascript urls
         if (strippedURLString.contains('"')) {
             if (strippedURLString.contains('\''))
                 strippedURLString.replaceWithLiteral('"', "&quot;");
             else
                 quoteChar = '\'';
         }
         result.append(quoteChar);
         result.append(strippedURLString);
         result.append(quoteChar);
         return;
     }

     // FIXME: This does not fully match other browsers. Firefox percent-escapes non-ASCII characters for innerHTML.
     result.append(quoteChar);
     appendAttributeValue(result, resolvedURLString, false);
     result.append(quoteChar);
 }

 void MarkupAccumulator::appendNodeValue(StringBuilder& result, const Node* node, const Range* range, EntityMask entityMask)
 {
     const String str = node->nodeValue();
     unsigned length = str.length();
     unsigned start = 0;

     if (range) {
         if (node == range->endContainer())
             length = range->endOffset();
         if (node == range->startContainer()) {
             start = range->startOffset();
             length -= start;
         }
     }

     appendCharactersReplacingEntities(result, str, start, length, entityMask);
 }

 bool MarkupAccumulator::shouldAddNamespaceElement(const Element* element)
 {
     // Don't add namespace attribute if it is already defined for this elem.
     const AtomicString& prefix = element->prefix();
     if (prefix.isEmpty())
         return !element->hasAttribute(xmlnsAtom);

     DEFINE_STATIC_LOCAL(String, xmlnsWithColon, (ASCIILiteral("xmlns:")));
     return !element->hasAttribute(xmlnsWithColon + prefix);
 }

 bool MarkupAccumulator::shouldAddNamespaceAttribute(const Attribute& attribute, Namespaces& namespaces)
 {
     namespaces.checkConsistency();

     // Don't add namespace attributes twice
     if (attribute.name() == XMLNSNames::xmlnsAttr) {
         namespaces.set(emptyAtom.impl(), attribute.value().impl());
         return false;
     }

     QualifiedName xmlnsPrefixAttr(xmlnsAtom, attribute.localName(), XMLNSNames::xmlnsNamespaceURI);
     if (attribute.name() == xmlnsPrefixAttr) {
         namespaces.set(attribute.localName().impl(), attribute.value().impl());
         return false;
     }

     return true;
 }

 void MarkupAccumulator::appendNamespace(StringBuilder& result, const AtomicString& prefix, const AtomicString& namespaceURI, Namespaces& namespaces)
 {
     namespaces.checkConsistency();
     if (namespaceURI.isEmpty())
         return;

     // Use emptyAtoms's impl() for both null and empty strings since the HashMap can't handle 0 as a key
     AtomicStringImpl* pre = prefix.isEmpty() ? emptyAtom.impl() : prefix.impl();
     AtomicStringImpl* foundNS = namespaces.get(pre);
     if (foundNS != namespaceURI.impl()) {
         namespaces.set(pre, namespaceURI.impl());
         result.append(' ');
         result.append(xmlnsAtom.string());
         if (!prefix.isEmpty()) {
             result.append(':');
             result.append(prefix);
         }

         result.append('=');
         result.append('"');
         appendAttributeValue(result, namespaceURI, false);
         result.append('"');
     }
 }

 EntityMask MarkupAccumulator::entityMaskForText(Text* text) const
 {
     const QualifiedName* parentName = 0;
     if (text->parentElement())
         parentName = &(text->parentElement())->tagQName();

     if (parentName && (*parentName == scriptTag || *parentName == styleTag || *parentName == xmpTag))
         return EntityMaskInCDATA;

     return text->document()->isHTMLDocument() ? EntityMaskInHTMLPCDATA : EntityMaskInPCDATA;
 }

 void MarkupAccumulator::appendText(StringBuilder& result, Text* text)
 {
     appendNodeValue(result, text, m_range, entityMaskForText(text));
 }

 void MarkupAccumulator::appendComment(StringBuilder& result, const String& comment)
 {
     // FIXME: Comment content is not escaped, but XMLSerializer (and possibly other callers) should raise an exception if it includes "-->".
     result.appendLiteral("<!--");
     result.append(comment);
     result.appendLiteral("-->");
 }

 void MarkupAccumulator::appendXMLDeclaration(StringBuilder& result, const Document* document)
 {
     if (!document->hasXMLDeclaration())
         return;

     result.appendLiteral("<?xml version=\"");
     result.append(document->xmlVersion());
     const String& encoding = document->xmlEncoding();
     if (!encoding.isEmpty()) {
         result.appendLiteral("\" encoding=\"");
         result.append(encoding);
     }
     if (document->xmlStandaloneStatus() != Document::StandaloneUnspecified) {
         result.appendLiteral("\" standalone=\"");
         if (document->xmlStandalone())
             result.appendLiteral("yes");
         else
             result.appendLiteral("no");
     }

     result.appendLiteral("\"?>");
 }

 void MarkupAccumulator::appendDocumentType(StringBuilder& result, const DocumentType* n)
 {
     if (n->name().isEmpty())
         return;

     result.appendLiteral("<!DOCTYPE ");
     result.append(n->name());
     if (!n->publicId().isEmpty()) {
         result.appendLiteral(" PUBLIC \"");
         result.append(n->publicId());
         result.append('"');
         if (!n->systemId().isEmpty()) {
             result.append(' ');
             result.append('"');
             result.append(n->systemId());
             result.append('"');
         }
     } else if (!n->systemId().isEmpty()) {
         result.appendLiteral(" SYSTEM \"");
         result.append(n->systemId());
         result.append('"');
     }
     if (!n->internalSubset().isEmpty()) {
         result.append(' ');
         result.append('[');
         result.append(n->internalSubset());
         result.append(']');
     }
     result.append('>');
 }

 void MarkupAccumulator::appendProcessingInstruction(StringBuilder& result, const String& target, const String& data)
 {
     // FIXME: PI data is not escaped, but XMLSerializer (and possibly other callers) this should raise an exception if it includes "?>".
     result.append('<');
     result.append('?');
     result.append(target);
     result.append(' ');
     result.append(data);
     result.append('?');
     result.append('>');
 }

 void MarkupAccumulator::appendElement(StringBuilder& result, Element* element, Namespaces* namespaces)
 {
     appendOpenTag(result, element, namespaces);

     if (element->hasAttributes()) {
         unsigned length = element->attributeCount();
         for (unsigned int i = 0; i < length; i++)
             appendAttribute(result, element, *element->attributeItem(i), namespaces);
     }

     // Give an opportunity to subclasses to add their own attributes.
     appendCustomAttributes(result, element, namespaces);

     appendCloseTag(result, element);
 }

 void MarkupAccumulator::appendOpenTag(StringBuilder& result, Element* element, Namespaces* namespaces)
 {
     result.append('<');
     result.append(element->nodeNamePreservingCase());
     if (!element->document()->isHTMLDocument() && namespaces && shouldAddNamespaceElement(element))
         appendNamespace(result, element->prefix(), element->namespaceURI(), *namespaces);
 }

 void MarkupAccumulator::appendCloseTag(StringBuilder& result, Element* element)
 {
     if (shouldSelfClose(element)) {
         if (element->isHTMLElement())
             result.append(' '); // XHTML 1.0 <-> HTML compatibility.
         result.append('/');
     }
     result.append('>');
 }

 static inline bool attributeIsInSerializedNamespace(const Attribute& attribute)
 {
     return attribute.namespaceURI() == XMLNames::xmlNamespaceURI
         || attribute.namespaceURI() == XLinkNames::xlinkNamespaceURI
         || attribute.namespaceURI() == XMLNSNames::xmlnsNamespaceURI;
 }

 void MarkupAccumulator::appendAttribute(StringBuilder& result, Element* element, const Attribute& attribute, Namespaces* namespaces)
 {
     bool documentIsHTML = element->document()->isHTMLDocument();

     result.append(' ');

     if (documentIsHTML && !attributeIsInSerializedNamespace(attribute))
         result.append(attribute.name().localName());
     else {
         QualifiedName prefixedName = attribute.name();
         if (attribute.namespaceURI() == XLinkNames::xlinkNamespaceURI) {
             if (!attribute.prefix())
                 prefixedName.setPrefix(xlinkAtom);
         } else if (attribute.namespaceURI() == XMLNames::xmlNamespaceURI) {
             if (!attribute.prefix())
                 prefixedName.setPrefix(xmlAtom);
         } else if (attribute.namespaceURI() == XMLNSNames::xmlnsNamespaceURI) {
             if (attribute.name() != XMLNSNames::xmlnsAttr && !attribute.prefix())
                 prefixedName.setPrefix(xmlnsAtom);
         }
         result.append(prefixedName.toString());
     }

     result.append('=');

     if (element->isURLAttribute(attribute))
         appendQuotedURLAttributeValue(result, element, attribute);
     else {
         result.append('"');
         appendAttributeValue(result, attribute.value(), documentIsHTML);
         result.append('"');
     }

     if (!documentIsHTML && namespaces && shouldAddNamespaceAttribute(attribute, *namespaces))
         appendNamespace(result, attribute.prefix(), attribute.namespaceURI(), *namespaces);
 }

 void MarkupAccumulator::appendCDATASection(StringBuilder& result, const String& section)
 {
     // FIXME: CDATA content is not escaped, but XMLSerializer (and possibly other callers) should raise an exception if it includes "]]>".
     result.appendLiteral("<![CDATA[");
     result.append(section);
     result.appendLiteral("]]>");
 }

 void MarkupAccumulator::appendStartMarkup(StringBuilder& result, const Node* node, Namespaces* namespaces)
 {
     if (namespaces)
         namespaces->checkConsistency();

     switch (node->nodeType()) {
     case Node::TEXT_NODE:
         appendText(result, toText(const_cast<Node*>(node)));
         break;
     case Node::COMMENT_NODE:
         appendComment(result, static_cast<const Comment*>(node)->data());
         break;
     case Node::DOCUMENT_NODE:
         appendXMLDeclaration(result, toDocument(node));
         break;
     case Node::DOCUMENT_FRAGMENT_NODE:
         break;
     case Node::DOCUMENT_TYPE_NODE:
         appendDocumentType(result, static_cast<const DocumentType*>(node));
         break;
     case Node::PROCESSING_INSTRUCTION_NODE:
         appendProcessingInstruction(result, static_cast<const ProcessingInstruction*>(node)->target(), static_cast<const ProcessingInstruction*>(node)->data());
         break;
     case Node::ELEMENT_NODE:
         appendElement(result, toElement(const_cast<Node*>(node)), namespaces);
         break;
     case Node::CDATA_SECTION_NODE:
         appendCDATASection(result, static_cast<const CDATASection*>(node)->data());
         break;
     case Node::ATTRIBUTE_NODE:
     case Node::ENTITY_NODE:
     case Node::ENTITY_REFERENCE_NODE:
     case Node::NOTATION_NODE:
     case Node::XPATH_NAMESPACE_NODE:
         ASSERT_NOT_REACHED();
         break;
     }
 }

 // Rules of self-closure
 // 1. No elements in HTML documents use the self-closing syntax.
 // 2. Elements w/ children never self-close because they use a separate end tag.
 // 3. HTML elements which do not have a "forbidden" end tag will close with a separate end tag.
 // 4. Other elements self-close.
 bool MarkupAccumulator::shouldSelfClose(const Node* node)
 {
     if (node->document()->isHTMLDocument())
         return false;
     if (node->hasChildNodes())
         return false;
     if (node->isHTMLElement() && !elementCannotHaveEndTag(node))
         return false;
     return true;
 }

 bool MarkupAccumulator::elementCannotHaveEndTag(const Node* node)
 {
     if (!node->isHTMLElement())
         return false;

     // FIXME: ieForbidsInsertHTML may not be the right function to call here
     // ieForbidsInsertHTML is used to disallow setting innerHTML/outerHTML
     // or createContextualFragment.  It does not necessarily align with
     // which elements should be serialized w/o end tags.
     return static_cast<const HTMLElement*>(node)->ieForbidsInsertHTML();
 }

 void MarkupAccumulator::appendEndMarkup(StringBuilder& result, const Node* node)
 {
     if (!node->isElementNode() || shouldSelfClose(node) || (!node->hasChildNodes() && elementCannotHaveEndTag(node)))
         return;

     result.append('<');
     result.append('/');
     result.append(toElement(node)->nodeNamePreservingCase());
     result.append('>');
 }

 }
	/*
	* Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2012 Apple Inc. All rights reserved.
	* Copyright (C) 2009, 2010 Google Inc. All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions
	* are met:
	* 1. Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimer in the
	* documentation and/or other materials provided with the distribution.
	*
	* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
	*/

	#include "config.h"
	#include "MarkupAccumulator.h"

	#include "CDATASection.h"
	#include "Comment.h"
	#include "DocumentFragment.h"
	#include "DocumentType.h"
	#include "Editor.h"
	#include "HTMLElement.h"
	#include "HTMLNames.h"
	#include "HTMLTemplateElement.h"
	#include "KURL.h"
	#include "ProcessingInstruction.h"
	#include "XLinkNames.h"
	#include "XMLNSNames.h"
	#include "XMLNames.h"
	#include <wtf/unicode/CharacterNames.h>

	namespace WebCore {

	using namespace HTMLNames;

	void MarkupAccumulator::appendCharactersReplacingEntities(StringBuilder& result, const String& source, unsigned offset, unsigned length, EntityMask entityMask)
	{
	DEFINE_STATIC_LOCAL(const String, ampReference, (ASCIILiteral("&")));
	DEFINE_STATIC_LOCAL(const String, ltReference, (ASCIILiteral("<")));
	DEFINE_STATIC_LOCAL(const String, gtReference, (ASCIILiteral(">")));
	DEFINE_STATIC_LOCAL(const String, quotReference, (ASCIILiteral(""")));
	DEFINE_STATIC_LOCAL(const String, nbspReference, (ASCIILiteral(" ")));

	static const EntityDescription entityMaps[] = {
	{ '&', ampReference, EntityAmp },
	{ '<', ltReference, EntityLt },
	{ '>', gtReference, EntityGt },
	{ '"', quotReference, EntityQuot },
	{ noBreakSpace, nbspReference, EntityNbsp },
	};

	if (!(offset + length))
	return;

	ASSERT(offset + length <= source.length());

	if (source.is8Bit()) {
	const LChar* text = source.characters8() + offset;

	size_t positionAfterLastEntity = 0;
	for (size_t i = 0; i < length; ++i) {
	for (size_t entityIndex = 0; entityIndex < WTF_ARRAY_LENGTH(entityMaps); ++entityIndex) {
	if (text[i] == entityMaps[entityIndex].entity && entityMaps[entityIndex].mask & entityMask) {
	result.append(text + positionAfterLastEntity, i - positionAfterLastEntity);
	result.append(entityMaps[entityIndex].reference);
	positionAfterLastEntity = i + 1;
	break;
	}
	}
	}
	result.append(text + positionAfterLastEntity, length - positionAfterLastEntity);
	} else {
	const UChar* text = source.characters16() + offset;

	size_t positionAfterLastEntity = 0;
	for (size_t i = 0; i < length; ++i) {
	for (size_t entityIndex = 0; entityIndex < WTF_ARRAY_LENGTH(entityMaps); ++entityIndex) {
	if (text[i] == entityMaps[entityIndex].entity && entityMaps[entityIndex].mask & entityMask) {
	result.append(text + positionAfterLastEntity, i - positionAfterLastEntity);
	result.append(entityMaps[entityIndex].reference);
	positionAfterLastEntity = i + 1;
	break;
	}
	}
	}
	result.append(text + positionAfterLastEntity, length - positionAfterLastEntity);
	}
	}

	MarkupAccumulator::MarkupAccumulator(Vector<Node> nodes, EAbsoluteURLs resolveUrlsMethod, const Range* range)
	: m_nodes(nodes)
	, m_range(range)
	, m_resolveURLsMethod(resolveUrlsMethod)
	{
	}

	MarkupAccumulator::~MarkupAccumulator()
	{
	}

	String MarkupAccumulator::serializeNodes(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly)
	{
	return serializeNodes(targetNode, nodeToSkip, childrenOnly, 0);
	}

	String MarkupAccumulator::serializeNodes(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly, Vector<QualifiedName>* tagNamesToSkip)
	{
	serializeNodesWithNamespaces(targetNode, nodeToSkip, childrenOnly, 0, tagNamesToSkip);
	return m_markup.toString();
	}

	void MarkupAccumulator::serializeNodesWithNamespaces(Node* targetNode, Node* nodeToSkip, EChildrenOnly childrenOnly, const Namespaces* namespaces, Vector<QualifiedName>* tagNamesToSkip)
	{
	if (targetNode == nodeToSkip)
	return;

	if (tagNamesToSkip) {
	for (size_t i = 0; i < tagNamesToSkip->size(); ++i) {
	if (targetNode->hasTagName(tagNamesToSkip->at(i)))
	return;
	}
	}

	Namespaces namespaceHash;
	if (namespaces)
	namespaceHash = *namespaces;

	if (!childrenOnly)
	appendStartTag(targetNode, &namespaceHash);

	if (!(targetNode->document()->isHTMLDocument() && elementCannotHaveEndTag(targetNode))) {
	#if ENABLE(TEMPLATE_ELEMENT)
	Node* current = targetNode->hasTagName(templateTag) ? toHTMLTemplateElement(targetNode)->content()->firstChild() : targetNode->firstChild();
	#else
	Node* current = targetNode->firstChild();
	#endif
	for ( ; current; current = current->nextSibling())
	serializeNodesWithNamespaces(current, nodeToSkip, IncludeNode, &namespaceHash, tagNamesToSkip);
	}

	if (!childrenOnly)
	appendEndTag(targetNode);
	}

	String MarkupAccumulator::resolveURLIfNeeded(const Element* element, const String& urlString) const
	{
	switch (m_resolveURLsMethod) {
	case ResolveAllURLs:
	return element->document()->completeURL(urlString).string();

	case ResolveNonLocalURLs:
	if (!element->document()->url().isLocalFile())
	return element->document()->completeURL(urlString).string();
	break;

	case DoNotResolveURLs:
	break;
	}
	return urlString;
	}

	void MarkupAccumulator::appendString(const String& string)
	{
	m_markup.append(string);
	}

	void MarkupAccumulator::appendStartTag(Node* node, Namespaces* namespaces)
	{
	appendStartMarkup(m_markup, node, namespaces);
	if (m_nodes)
	m_nodes->append(node);
	}

	void MarkupAccumulator::appendEndTag(Node* node)
	{
	appendEndMarkup(m_markup, node);
	}

	size_t MarkupAccumulator::totalLength(const Vector<String>& strings)
	{
	size_t length = 0;
	for (size_t i = 0; i < strings.size(); ++i)
	length += strings[i].length();
	return length;
	}

	void MarkupAccumulator::concatenateMarkup(StringBuilder& result)
	{
	result.append(m_markup);
	}

	void MarkupAccumulator::appendAttributeValue(StringBuilder& result, const String& attribute, bool documentIsHTML)
	{
	appendCharactersReplacingEntities(result, attribute, 0, attribute.length(),
	documentIsHTML ? EntityMaskInHTMLAttributeValue : EntityMaskInAttributeValue);
	}

	void MarkupAccumulator::appendCustomAttributes(StringBuilder&, Element, Namespaces)
	{
	}

	void MarkupAccumulator::appendQuotedURLAttributeValue(StringBuilder& result, const Element* element, const Attribute& attribute)
	{
	ASSERT(element->isURLAttribute(attribute));
	const String resolvedURLString = resolveURLIfNeeded(element, attribute.value());
	UChar quoteChar = '"';
	String strippedURLString = resolvedURLString.stripWhiteSpace();
	if (protocolIsJavaScript(strippedURLString)) {
	// minimal escaping for javascript urls
	if (strippedURLString.contains('"')) {
	if (strippedURLString.contains('\''))
	strippedURLString.replaceWithLiteral('"', """);
	else
	quoteChar = '\'';
	}
	result.append(quoteChar);
	result.append(strippedURLString);
	result.append(quoteChar);
	return;
	}

	// FIXME: This does not fully match other browsers. Firefox percent-escapes non-ASCII characters for innerHTML.
	result.append(quoteChar);
	appendAttributeValue(result, resolvedURLString, false);
	result.append(quoteChar);
	}

	void MarkupAccumulator::appendNodeValue(StringBuilder& result, const Node* node, const Range* range, EntityMask entityMask)
	{
	const String str = node->nodeValue();
	unsigned length = str.length();
	unsigned start = 0;

	if (range) {
	if (node == range->endContainer())
	length = range->endOffset();
	if (node == range->startContainer()) {
	start = range->startOffset();
	length -= start;
	}
	}

	appendCharactersReplacingEntities(result, str, start, length, entityMask);
	}

	bool MarkupAccumulator::shouldAddNamespaceElement(const Element* element)
	{
	// Don't add namespace attribute if it is already defined for this elem.
	const AtomicString& prefix = element->prefix();
	if (prefix.isEmpty())
	return !element->hasAttribute(xmlnsAtom);

	DEFINE_STATIC_LOCAL(String, xmlnsWithColon, (ASCIILiteral("xmlns:")));
	return !element->hasAttribute(xmlnsWithColon + prefix);
	}

	bool MarkupAccumulator::shouldAddNamespaceAttribute(const Attribute& attribute, Namespaces& namespaces)
	{
	namespaces.checkConsistency();

	// Don't add namespace attributes twice
	if (attribute.name() == XMLNSNames::xmlnsAttr) {
	namespaces.set(emptyAtom.impl(), attribute.value().impl());
	return false;
	}

	QualifiedName xmlnsPrefixAttr(xmlnsAtom, attribute.localName(), XMLNSNames::xmlnsNamespaceURI);
	if (attribute.name() == xmlnsPrefixAttr) {
	namespaces.set(attribute.localName().impl(), attribute.value().impl());
	return false;
	}

	return true;
	}

	void MarkupAccumulator::appendNamespace(StringBuilder& result, const AtomicString& prefix, const AtomicString& namespaceURI, Namespaces& namespaces)
	{
	namespaces.checkConsistency();
	if (namespaceURI.isEmpty())
	return;

	// Use emptyAtoms's impl() for both null and empty strings since the HashMap can't handle 0 as a key
	AtomicStringImpl* pre = prefix.isEmpty() ? emptyAtom.impl() : prefix.impl();
	AtomicStringImpl* foundNS = namespaces.get(pre);
	if (foundNS != namespaceURI.impl()) {
	namespaces.set(pre, namespaceURI.impl());
	result.append(' ');
	result.append(xmlnsAtom.string());
	if (!prefix.isEmpty()) {
	result.append(':');
	result.append(prefix);
	}

	result.append('=');
	result.append('"');
	appendAttributeValue(result, namespaceURI, false);
	result.append('"');
	}
	}

	EntityMask MarkupAccumulator::entityMaskForText(Text* text) const
	{
	const QualifiedName* parentName = 0;
	if (text->parentElement())
	parentName = &(text->parentElement())->tagQName();

	if (parentName && (parentName == scriptTag \|\| parentName == styleTag \|\| *parentName == xmpTag))
	return EntityMaskInCDATA;

	return text->document()->isHTMLDocument() ? EntityMaskInHTMLPCDATA : EntityMaskInPCDATA;
	}

	void MarkupAccumulator::appendText(StringBuilder& result, Text* text)
	{
	appendNodeValue(result, text, m_range, entityMaskForText(text));
	}

	void MarkupAccumulator::appendComment(StringBuilder& result, const String& comment)
	{
	// FIXME: Comment content is not escaped, but XMLSerializer (and possibly other callers) should raise an exception if it includes "-->".
	result.appendLiteral("<!--");
	result.append(comment);
	result.appendLiteral("-->");
	}

	void MarkupAccumulator::appendXMLDeclaration(StringBuilder& result, const Document* document)
	{
	if (!document->hasXMLDeclaration())
	return;

	result.appendLiteral("<?xml version=\"");
	result.append(document->xmlVersion());
	const String& encoding = document->xmlEncoding();
	if (!encoding.isEmpty()) {
	result.appendLiteral("\" encoding=\"");
	result.append(encoding);
	}
	if (document->xmlStandaloneStatus() != Document::StandaloneUnspecified) {
	result.appendLiteral("\" standalone=\"");
	if (document->xmlStandalone())
	result.appendLiteral("yes");
	else
	result.appendLiteral("no");
	}

	result.appendLiteral("\"?>");
	}

	void MarkupAccumulator::appendDocumentType(StringBuilder& result, const DocumentType* n)
	{
	if (n->name().isEmpty())
	return;

	result.appendLiteral("<!DOCTYPE ");
	result.append(n->name());
	if (!n->publicId().isEmpty()) {
	result.appendLiteral(" PUBLIC \"");
	result.append(n->publicId());
	result.append('"');
	if (!n->systemId().isEmpty()) {
	result.append(' ');
	result.append('"');
	result.append(n->systemId());
	result.append('"');
	}
	} else if (!n->systemId().isEmpty()) {
	result.appendLiteral(" SYSTEM \"");
	result.append(n->systemId());
	result.append('"');
	}
	if (!n->internalSubset().isEmpty()) {
	result.append(' ');
	result.append('[');
	result.append(n->internalSubset());
	result.append(']');
	}
	result.append('>');
	}

	void MarkupAccumulator::appendProcessingInstruction(StringBuilder& result, const String& target, const String& data)
	{
	// FIXME: PI data is not escaped, but XMLSerializer (and possibly other callers) this should raise an exception if it includes "?>".
	result.append('<');
	result.append('?');
	result.append(target);
	result.append(' ');
	result.append(data);
	result.append('?');
	result.append('>');
	}

	void MarkupAccumulator::appendElement(StringBuilder& result, Element* element, Namespaces* namespaces)
	{
	appendOpenTag(result, element, namespaces);

	if (element->hasAttributes()) {
	unsigned length = element->attributeCount();
	for (unsigned int i = 0; i < length; i++)
	appendAttribute(result, element, *element->attributeItem(i), namespaces);
	}

	// Give an opportunity to subclasses to add their own attributes.
	appendCustomAttributes(result, element, namespaces);

	appendCloseTag(result, element);
	}

	void MarkupAccumulator::appendOpenTag(StringBuilder& result, Element* element, Namespaces* namespaces)
	{
	result.append('<');
	result.append(element->nodeNamePreservingCase());
	if (!element->document()->isHTMLDocument() && namespaces && shouldAddNamespaceElement(element))
	appendNamespace(result, element->prefix(), element->namespaceURI(), *namespaces);
	}

	void MarkupAccumulator::appendCloseTag(StringBuilder& result, Element* element)
	{
	if (shouldSelfClose(element)) {
	if (element->isHTMLElement())
	result.append(' '); // XHTML 1.0 <-> HTML compatibility.
	result.append('/');
	}
	result.append('>');
	}

	static inline bool attributeIsInSerializedNamespace(const Attribute& attribute)
	{
	return attribute.namespaceURI() == XMLNames::xmlNamespaceURI
	\|\| attribute.namespaceURI() == XLinkNames::xlinkNamespaceURI
	\|\| attribute.namespaceURI() == XMLNSNames::xmlnsNamespaceURI;
	}

	void MarkupAccumulator::appendAttribute(StringBuilder& result, Element* element, const Attribute& attribute, Namespaces* namespaces)
	{
	bool documentIsHTML = element->document()->isHTMLDocument();

	result.append(' ');

	if (documentIsHTML && !attributeIsInSerializedNamespace(attribute))
	result.append(attribute.name().localName());
	else {
	QualifiedName prefixedName = attribute.name();
	if (attribute.namespaceURI() == XLinkNames::xlinkNamespaceURI) {
	if (!attribute.prefix())
	prefixedName.setPrefix(xlinkAtom);
	} else if (attribute.namespaceURI() == XMLNames::xmlNamespaceURI) {
	if (!attribute.prefix())
	prefixedName.setPrefix(xmlAtom);
	} else if (attribute.namespaceURI() == XMLNSNames::xmlnsNamespaceURI) {
	if (attribute.name() != XMLNSNames::xmlnsAttr && !attribute.prefix())
	prefixedName.setPrefix(xmlnsAtom);
	}
	result.append(prefixedName.toString());
	}

	result.append('=');

	if (element->isURLAttribute(attribute))
	appendQuotedURLAttributeValue(result, element, attribute);
	else {
	result.append('"');
	appendAttributeValue(result, attribute.value(), documentIsHTML);
	result.append('"');
	}

	if (!documentIsHTML && namespaces && shouldAddNamespaceAttribute(attribute, *namespaces))
	appendNamespace(result, attribute.prefix(), attribute.namespaceURI(), *namespaces);
	}

	void MarkupAccumulator::appendCDATASection(StringBuilder& result, const String& section)
	{
	// FIXME: CDATA content is not escaped, but XMLSerializer (and possibly other callers) should raise an exception if it includes "]]>".
	result.appendLiteral("<![CDATA[");
	result.append(section);
	result.appendLiteral("]]>");
	}

	void MarkupAccumulator::appendStartMarkup(StringBuilder& result, const Node* node, Namespaces* namespaces)
	{
	if (namespaces)
	namespaces->checkConsistency();

	switch (node->nodeType()) {
	case Node::TEXT_NODE:
	appendText(result, toText(const_cast<Node*>(node)));
	break;
	case Node::COMMENT_NODE:
	appendComment(result, static_cast<const Comment*>(node)->data());
	break;
	case Node::DOCUMENT_NODE:
	appendXMLDeclaration(result, toDocument(node));
	break;
	case Node::DOCUMENT_FRAGMENT_NODE:
	break;
	case Node::DOCUMENT_TYPE_NODE:
	appendDocumentType(result, static_cast<const DocumentType*>(node));
	break;
	case Node::PROCESSING_INSTRUCTION_NODE:
	appendProcessingInstruction(result, static_cast<const ProcessingInstruction>(node)->target(), static_cast<const ProcessingInstruction>(node)->data());
	break;
	case Node::ELEMENT_NODE:
	appendElement(result, toElement(const_cast<Node*>(node)), namespaces);
	break;
	case Node::CDATA_SECTION_NODE:
	appendCDATASection(result, static_cast<const CDATASection*>(node)->data());
	break;
	case Node::ATTRIBUTE_NODE:
	case Node::ENTITY_NODE:
	case Node::ENTITY_REFERENCE_NODE:
	case Node::NOTATION_NODE:
	case Node::XPATH_NAMESPACE_NODE:
	ASSERT_NOT_REACHED();
	break;
	}
	}

	// Rules of self-closure
	// 1. No elements in HTML documents use the self-closing syntax.
	// 2. Elements w/ children never self-close because they use a separate end tag.
	// 3. HTML elements which do not have a "forbidden" end tag will close with a separate end tag.
	// 4. Other elements self-close.
	bool MarkupAccumulator::shouldSelfClose(const Node* node)
	{
	if (node->document()->isHTMLDocument())
	return false;
	if (node->hasChildNodes())
	return false;
	if (node->isHTMLElement() && !elementCannotHaveEndTag(node))
	return false;
	return true;
	}

	bool MarkupAccumulator::elementCannotHaveEndTag(const Node* node)
	{
	if (!node->isHTMLElement())
	return false;

	// FIXME: ieForbidsInsertHTML may not be the right function to call here
	// ieForbidsInsertHTML is used to disallow setting innerHTML/outerHTML
	// or createContextualFragment. It does not necessarily align with
	// which elements should be serialized w/o end tags.
	return static_cast<const HTMLElement*>(node)->ieForbidsInsertHTML();
	}

	void MarkupAccumulator::appendEndMarkup(StringBuilder& result, const Node* node)
	{
	if (!node->isElementNode() \|\| shouldSelfClose(node) \|\| (!node->hasChildNodes() && elementCannotHaveEndTag(node)))
	return;

	result.append('<');
	result.append('/');
	result.append(toElement(node)->nodeNamePreservingCase());
	result.append('>');
	}

	}