ChangeLog

2013-02-11  Eric Seidel  <eric@webkit.org>

        Fold MarkupTokenBase into HTMLToken now that it has no other subclasses

        https://bugs.webkit.org/show_bug.cgi?id=109483

        Reviewed by NOBODY (OOPS!).

        This deletes an epic amount of template yuck, as well as removes

        a vtable !?! from HTMLToken.

        This paves the way for further cleanup of HTMLToken now that we

        can see the whole object at once.

        We'll also probably re-create an HTMLToken.cpp again, now that we're

        free from the chains of template nonsense.

        * GNUmakefile.list.am:

        * Target.pri:

        * WebCore.gypi:

        * WebCore.vcproj/WebCore.vcproj:

        * WebCore.vcxproj/WebCore.vcxproj:

        * WebCore.vcxproj/WebCore.vcxproj.filters:

        * WebCore.xcodeproj/project.pbxproj:

        * html/parser/HTMLToken.h:

        (WebCore::findAttributeInVector):

        (WebCore):

        (HTMLToken):

        (Attribute):

        (Range):

        (WebCore::HTMLToken::HTMLToken):

        (WebCore::HTMLToken::clear):

        (WebCore::HTMLToken::isUninitialized):

        (WebCore::HTMLToken::type):

        (WebCore::HTMLToken::makeEndOfFile):

        (WebCore::HTMLToken::startIndex):

        (WebCore::HTMLToken::endIndex):

        (WebCore::HTMLToken::setBaseOffset):

        (WebCore::HTMLToken::end):

        (WebCore::HTMLToken::data):

        (WebCore::HTMLToken::isAll8BitData):

        (WebCore::HTMLToken::name):

        (WebCore::HTMLToken::appendToName):

        (WebCore::HTMLToken::nameString):

        (WebCore::HTMLToken::selfClosing):

        (WebCore::HTMLToken::setSelfClosing):

        (WebCore::HTMLToken::beginStartTag):

        (WebCore::HTMLToken::beginEndTag):

        (WebCore::HTMLToken::addNewAttribute):

        (WebCore::HTMLToken::beginAttributeName):

        (WebCore::HTMLToken::endAttributeName):

        (WebCore::HTMLToken::beginAttributeValue):

        (WebCore::HTMLToken::endAttributeValue):

        (WebCore::HTMLToken::appendToAttributeName):

        (WebCore::HTMLToken::appendToAttributeValue):

        (WebCore::HTMLToken::attributes):

        (WebCore::HTMLToken::eraseValueOfAttribute):

        (WebCore::HTMLToken::ensureIsCharacterToken):

        (WebCore::HTMLToken::characters):

        (WebCore::HTMLToken::appendToCharacter):

        (WebCore::HTMLToken::comment):

        (WebCore::HTMLToken::beginComment):

        (WebCore::HTMLToken::appendToComment):

        (WebCore::HTMLToken::eraseCharacters):

        * html/parser/HTMLTokenTypes.h:

        * html/parser/XSSAuditor.h:

        * xml/parser/MarkupTokenBase.h: Removed.

2013-02-11  Eric Seidel  <eric@webkit.org>

        Make WebVTTTokenizer stop inheriting from MarkupTokenizerBase

        https://bugs.webkit.org/show_bug.cgi?id=109411

Source/WebCore/GNUmakefile.list.am

@@webcore_sources += \

	Source/WebCore/workers/WorkerThread.cpp \

	Source/WebCore/workers/WorkerThread.h \

	Source/WebCore/xml/parser/CharacterReferenceParserInlines.h \

4712 Source/WebCore/xml/parser/MarkupTokenBase.h \

	Source/WebCore/xml/parser/MarkupTokenizerBase.h \

	Source/WebCore/xml/parser/MarkupTokenizerInlines.h \

	Source/WebCore/xml/parser/XMLDocumentParser.cpp \

Source/WebCore/Target.pri

@@HEADERS += \

    workers/WorkerScriptLoader.h \

    workers/WorkerThread.h \

    xml/parser/CharacterReferenceParserInlines.h \

2853 xml/parser/MarkupTokenBase.h \

    xml/parser/MarkupTokenizerBase.h \

    xml/parser/MarkupTokenizerInlines.h \

    xml/parser/XMLDocumentParser.h \

Source/WebCore/WebCore.gypi

            'workers/chromium/WorkerContextProxyChromium.cpp',

            'workers/chromium/WorkerContextProxyChromium.h',

            'xml/parser/CharacterReferenceParserInlines.h',

2673 'xml/parser/MarkupTokenBase.h',

            'xml/parser/MarkupTokenizerBase.h',

            'xml/parser/MarkupTokenizerInlines.h',

            'xml/parser/XMLDocumentParser.cpp',

Source/WebCore/WebCore.vcproj/WebCore.vcproj

				Name="parser"

				>

				<File

					RelativePath="..\xml\parser\MarkupTokenBase.h"

					>

				</File>

				<File

					RelativePath="..\xml\parser\MarkupTokenizerBase.h"

					>

				</File>

Source/WebCore/WebCore.vcxproj/WebCore.vcxproj

    <ClInclude Include="..\xml\XSLTExtensions.h" />

    <ClInclude Include="..\xml\XSLTProcessor.h" />

    <ClInclude Include="..\xml\XSLTUnicodeSort.h" />

7516 <ClInclude Include="..\xml\parser\MarkupTokenBase.h" />

    <ClInclude Include="..\xml\parser\MarkupTokenizerBase.h" />

    <ClInclude Include="..\xml\parser\MarkupTokenizerInlines.h" />

    <ClInclude Include="..\xml\parser\XMLDocumentParser.h" />

Source/WebCore/WebCore.vcxproj/WebCore.vcxproj.filters

    <ClInclude Include="..\xml\XSLTUnicodeSort.h">

      <Filter>xml</Filter>

    </ClInclude>

    <ClInclude Include="..\xml\parser\MarkupTokenBase.h">

      <Filter>xml\parser</Filter>

    </ClInclude>

    <ClInclude Include="..\xml\parser\MarkupTokenizerBase.h">

      <Filter>xml\parser</Filter>

    </ClInclude>

Source/WebCore/WebCore.xcodeproj/project.pbxproj

		0014628A103CD1DE000B20DB /* OriginAccessEntry.cpp in Sources */ = {isa = PBXBuildFile; fileRef = 00146288103CD1DE000B20DB /* OriginAccessEntry.cpp */; };

		0014628B103CD1DE000B20DB /* OriginAccessEntry.h in Headers */ = {isa = PBXBuildFile; fileRef = 00146289103CD1DE000B20DB /* OriginAccessEntry.h */; };

		003F1FEA11E6AB43008258D9 /* UserContentTypes.h in Headers */ = {isa = PBXBuildFile; fileRef = 003F1FE911E6AB43008258D9 /* UserContentTypes.h */; settings = {ATTRIBUTES = (Private, ); }; };

51 00A629C113D0BEC70050AC52 /* MarkupTokenBase.h in Headers */ = {isa = PBXBuildFile; fileRef = 00A629C013D0BEC70050AC52 /* MarkupTokenBase.h */; };

		00B9318713BA8DB30035A948 /* XMLDocumentParser.cpp in Sources */ = {isa = PBXBuildFile; fileRef = 00B9318113BA867F0035A948 /* XMLDocumentParser.cpp */; };

		00B9318813BA8DBA0035A948 /* XMLDocumentParser.h in Headers */ = {isa = PBXBuildFile; fileRef = 00B9318213BA867F0035A948 /* XMLDocumentParser.h */; };

		00B9318913BA8DBC0035A948 /* XMLDocumentParserLibxml2.cpp in Sources */ = {isa = PBXBuildFile; fileRef = 00B9318313BA867F0035A948 /* XMLDocumentParserLibxml2.cpp */; };

		00146288103CD1DE000B20DB /* OriginAccessEntry.cpp */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.cpp; path = OriginAccessEntry.cpp; sourceTree = "<group>"; };

		00146289103CD1DE000B20DB /* OriginAccessEntry.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = OriginAccessEntry.h; sourceTree = "<group>"; };

		003F1FE911E6AB43008258D9 /* UserContentTypes.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = UserContentTypes.h; sourceTree = "<group>"; };

7297 00A629C013D0BEC70050AC52 /* MarkupTokenBase.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = MarkupTokenBase.h; sourceTree = "<group>"; };

		00B9318113BA867F0035A948 /* XMLDocumentParser.cpp */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.cpp; path = XMLDocumentParser.cpp; sourceTree = "<group>"; };

		00B9318213BA867F0035A948 /* XMLDocumentParser.h */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.c.h; path = XMLDocumentParser.h; sourceTree = "<group>"; };

		00B9318313BA867F0035A948 /* XMLDocumentParserLibxml2.cpp */ = {isa = PBXFileReference; fileEncoding = 4; lastKnownFileType = sourcecode.cpp.cpp; path = XMLDocumentParserLibxml2.cpp; sourceTree = "<group>"; };

			isa = PBXGroup;

			children = (

				97B8FFCF16AE7F920038388D /* CharacterReferenceParserInlines.h */,

14574 00A629C013D0BEC70050AC52 /* MarkupTokenBase.h */,

				00C60E4113D797AE0092A275 /* MarkupTokenizerBase.h */,

				00C60E3E13D76D7E0092A275 /* MarkupTokenizerInlines.h */,

				00B9318113BA867F0035A948 /* XMLDocumentParser.cpp */,

				1A8F6BC60DB55CDC001DB794 /* ManifestParser.h in Headers */,

				93309DF8099E64920056E581 /* markup.h in Headers */,

				9728C3141268E4390041E89B /* MarkupAccumulator.h in Headers */,

25305 00A629C113D0BEC70050AC52 /* MarkupTokenBase.h in Headers */,

				00C60E4213D797AE0092A275 /* MarkupTokenizerBase.h in Headers */,

				00C60E3F13D76D7E0092A275 /* MarkupTokenizerInlines.h in Headers */,

				FABE72F51059C1EB00D999DD /* MathMLElement.h in Headers */,

Source/WebCore/html/parser/HTMLToken.h

/*

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions

#ifndef HTMLToken_h

#define HTMLToken_h

29#include "Attribute.h"

2930#include "CompactHTMLToken.h"

3031#include "HTMLTokenTypes.h"

31 #include "MarkupTokenBase.h"

#include <wtf/RefCounted.h>

#include <wtf/RefPtr.h>

@@public:

    bool m_forceQuirks;

};

55 class HTMLToken : public MarkupTokenBase<HTMLTokenTypes> {

// Scans |attributes| front to back and returns a pointer to the first entry
// whose name matches |name|. Returns 0 when no entry matches. The returned
// pointer refers to an element stored inside |attributes|.
static inline Attribute* findAttributeInVector(Vector<Attribute>& attributes, const QualifiedName& name)
{
    unsigned index = 0;
    while (index < attributes.size()) {
        Attribute& candidate = attributes.at(index);
        if (candidate.name().matches(name))
            return &candidate;
        ++index;
    }
    return 0;
}

class HTMLToken {

    WTF_MAKE_NONCOPYABLE(HTMLToken);

    WTF_MAKE_FAST_ALLOCATED;

5667public:

57 void appendToName(UChar character)

    typedef HTMLTokenTypes Type;

    // One attribute of a start/end tag token as collected during lexing.
    // All members are public and are written directly by the token's
    // begin*/end*/appendTo* attribute methods.
    class Attribute {

    public:

        // A pair of integer offsets. The attribute range setters store
        // values of the form (offset - m_baseOffset).
        class Range {

        public:

            int m_start;

            int m_end;

        };

        // Offsets covering the attribute's name.
        Range m_nameRange;

        // Offsets covering the attribute's value.
        Range m_valueRange;

        // Characters of the attribute name, appended one at a time.
        WTF::Vector<UChar, 32> m_name;

        // Characters of the attribute value.
        WTF::Vector<UChar, 32> m_value;

    };

    typedef WTF::Vector<Attribute, 10> AttributeList;

    typedef WTF::Vector<UChar, 1024> DataVector;

    // A newly constructed token starts in the state produced by clear().
    HTMLToken()
    {
        clear();
    }

    void clear()

5890 {

59 ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag || m_type == HTMLTokenTypes::DOCTYPE);

60 MarkupTokenBase<HTMLTokenTypes>::appendToName(character);

        m_type = Type::Uninitialized;

        m_range.m_start = 0;

        m_range.m_end = 0;

        m_baseOffset = 0;

        m_data.clear();

        m_orAllData = 0;

    }

    bool isUninitialized() { return m_type == HTMLTokenTypes::Uninitialized; }

    typename HTMLTokenTypes::Type type() const { return m_type; }

    // Turns a still-uninitialized token into the EndOfFile token.
    // The ASSERT requires that no other type has been assigned yet.
    void makeEndOfFile()

    {

        ASSERT(m_type == HTMLTokenTypes::Uninitialized);

        m_type = HTMLTokenTypes::EndOfFile;

    }

    /* Range and offset methods exposed for HTMLSourceTracker and HTMLViewSourceParser */

    // Start of the token's range (m_range.m_start).
    int startIndex() const
    {
        return m_range.m_start;
    }

    // End of the token's range (m_range.m_end), as recorded by end().
    int endIndex() const
    {
        return m_range.m_end;
    }

    // Records the offset that end() and the attribute range setters
    // subtract from the offsets they are given.
    void setBaseOffset(int offset)

    {

        m_baseOffset = offset;

    }

    // Stores the end of the token's range, expressed relative to the
    // base offset set through setBaseOffset().
    void end(int endOffset)
    {
        const int relativeEnd = endOffset - m_baseOffset;
        m_range.m_end = relativeEnd;
    }

    // Read-only access to the token's character buffer. Only valid (per the
    // ASSERT) for Character, Comment, StartTag and EndTag tokens.
    const DataVector& data() const

    {

        ASSERT(m_type == HTMLTokenTypes::Character || m_type == HTMLTokenTypes::Comment || m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        return m_data;

    }

    // True when the OR of the characters accumulated in m_orAllData has no
    // bit set above the low byte.
    bool isAll8BitData() const
    {
        return m_orAllData < 0x100;
    }

    // Read-only access to the tag/doctype name, which is stored in m_data.
    // Only valid (per the ASSERT) for StartTag, EndTag and DOCTYPE tokens.
    const DataVector& name() const
    {
        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag || m_type == HTMLTokenTypes::DOCTYPE);
        return m_data;
    }

    // Appends one non-null character to the name of a StartTag, EndTag or
    // DOCTYPE token and folds it into the 8-bit tracking accumulator.
    void appendToName(UChar character)
    {
        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag || m_type == HTMLTokenTypes::DOCTYPE);
        ASSERT(character);

        m_orAllData |= character;
        m_data.append(character);
    }

    // FIXME: Rename this to copyNameAsString().

    // Builds a String copy of the name held in m_data.
    // - Empty buffer: returns emptyString().
    // - isAll8BitData(): builds the result with String::make8BitFrom16BitSource.
    // - Otherwise: constructs the String directly from the UChar buffer.
    String nameString() const
    {
        if (!m_data.size())
            return emptyString();
        if (isAll8BitData())
            return String::make8BitFrom16BitSource(m_data.data(), m_data.size());
        return String(m_data.data(), m_data.size());
    }

68156

157 /* DOCTYPE Tokens */

158

    bool forceQuirks() const

    {

        ASSERT(m_type == HTMLTokenTypes::DOCTYPE);

@@public:

        return m_doctypeData.release();

    }

    /* Start/End Tag Tokens */

    // Whether setSelfClosing() has been called since the tag was begun.
    // Only valid (per the ASSERT) for StartTag and EndTag tokens.
    bool selfClosing() const

    {

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        return m_selfClosing;

    }

    // Flags the current StartTag/EndTag token as self-closing. There is no
    // way to unset the flag other than beginning a new tag.
    void setSelfClosing()

    {

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        m_selfClosing = true;

    }

    // Turns an uninitialized token into a StartTag whose name begins with
    // the non-null |character|, and resets all per-tag state.
    void beginStartTag(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == HTMLTokenTypes::Uninitialized);
        m_type = HTMLTokenTypes::StartTag;

        // First character of the tag name.
        m_orAllData |= character;
        m_data.append(character);

        // Fresh tag: no attributes yet, not self-closing.
        m_attributes.clear();
        m_currentAttribute = 0;
        m_selfClosing = false;
    }

    // Turns an uninitialized token into an EndTag whose name begins with
    // |character|, and resets all per-tag state. m_orAllData is left as is.
    void beginEndTag(LChar character)
    {
        ASSERT(m_type == HTMLTokenTypes::Uninitialized);
        m_type = HTMLTokenTypes::EndTag;

        // First character of the tag name.
        m_data.append(character);

        // Fresh tag: no attributes yet, not self-closing.
        m_attributes.clear();
        m_currentAttribute = 0;
        m_selfClosing = false;
    }

    // Turns an uninitialized token into an EndTag whose name starts with all
    // of |characters|, and resets all per-tag state. m_orAllData is left as is.
    void beginEndTag(const Vector<LChar, 32>& characters)
    {
        ASSERT(m_type == HTMLTokenTypes::Uninitialized);
        m_type = HTMLTokenTypes::EndTag;

        // Initial run of name characters.
        m_data.appendVector(characters);

        // Fresh tag: no attributes yet, not self-closing.
        m_attributes.clear();
        m_currentAttribute = 0;
        m_selfClosing = false;
    }

    void addNewAttribute()

    {

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        m_attributes.grow(m_attributes.size() + 1);

        m_currentAttribute = &m_attributes.last();

#ifndef NDEBUG

        m_currentAttribute->m_nameRange.m_start = 0;

        m_currentAttribute->m_nameRange.m_end = 0;

        m_currentAttribute->m_valueRange.m_start = 0;

        m_currentAttribute->m_valueRange.m_end = 0;

#endif

    }

    // Records where the current attribute's name starts, relative to the
    // base offset.
    void beginAttributeName(int offset)
    {
        const int relativeStart = offset - m_baseOffset;
        m_currentAttribute->m_nameRange.m_start = relativeStart;
    }

    void endAttributeName(int offset)

    {

        int index = offset - m_baseOffset;

        m_currentAttribute->m_nameRange.m_end = index;

        m_currentAttribute->m_valueRange.m_start = index;

        m_currentAttribute->m_valueRange.m_end = index;

    }

    void beginAttributeValue(int offset)

    {

        m_currentAttribute->m_valueRange.m_start = offset - m_baseOffset;

#ifndef NDEBUG

        m_currentAttribute->m_valueRange.m_end = 0;

#endif

    }

    // Records where the current attribute's value ends, relative to the
    // base offset.
    void endAttributeValue(int offset)
    {
        const int relativeEnd = offset - m_baseOffset;
        m_currentAttribute->m_valueRange.m_end = relativeEnd;
    }

    // Appends one non-null character to the name of the current attribute
    // (the one most recently created by addNewAttribute()).
    // Only valid (per the ASSERT) for StartTag and EndTag tokens.
    void appendToAttributeName(UChar character)

    {

        ASSERT(character);

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        // FIXME: We should be able to add the following ASSERT once we fix

        // https://bugs.webkit.org/show_bug.cgi?id=62971

        //   ASSERT(m_currentAttribute->m_nameRange.m_start);

        m_currentAttribute->m_name.append(character);

    }

    // Appends one non-null character to the value of the current attribute.
    // The last ASSERT requires that the value's start offset is non-zero,
    // i.e. that it has been set since addNewAttribute() zeroed it in debug
    // builds.
    void appendToAttributeValue(UChar character)

    {

        ASSERT(character);

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        ASSERT(m_currentAttribute->m_valueRange.m_start);

        m_currentAttribute->m_value.append(character);

    }

    // Appends the whole of the non-empty |value| to the value of the
    // attribute at index |i| (not necessarily the current attribute).
    void appendToAttributeValue(size_t i, const String& value)
    {
        ASSERT(!value.isEmpty());
        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);
        Attribute& target = m_attributes[i];
        target.m_value.append(value.characters(), value.length());
    }

    // Read-only access to the attributes collected for the current tag.
    // Only valid (per the ASSERT) for StartTag and EndTag tokens.
    const AttributeList& attributes() const

    {

        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);

        return m_attributes;

    }

    // Used by the XSSAuditor to nuke XSS-laden attributes.

    // Empties the value of the attribute at index |i|; the attribute itself
    // and its name stay in the list.
    void eraseValueOfAttribute(size_t i)
    {
        ASSERT(m_type == HTMLTokenTypes::StartTag || m_type == HTMLTokenTypes::EndTag);
        Attribute& target = m_attributes[i];
        target.m_value.clear();
    }

    /* Character Tokens */

    // Starting a character token works slightly differently than starting

    // other types of tokens because we want to save a per-character branch.

    // Sets the type to Character unconditionally. May be called repeatedly:
    // the ASSERT accepts a token that is either Uninitialized or already
    // a Character token.
    void ensureIsCharacterToken()

    {

        ASSERT(m_type == HTMLTokenTypes::Uninitialized || m_type == HTMLTokenTypes::Character);

        m_type = HTMLTokenTypes::Character;

    }

    // Read-only access to the text of a Character token (stored in m_data).
    const DataVector& characters() const

    {

        ASSERT(m_type == HTMLTokenTypes::Character);

        return m_data;

    }

    // Appends a single narrow character to a Character token.
    // Unlike the UChar overload this does not update m_orAllData.
    // NOTE(review): presumably callers only pass ASCII here - confirm.
    void appendToCharacter(char character)

    {

        ASSERT(m_type == HTMLTokenTypes::Character);

        m_data.append(character);

    }

    // Appends a single UChar to a Character token and folds it into the
    // accumulator consulted by isAll8BitData().
    void appendToCharacter(UChar character)
    {
        ASSERT(m_type == HTMLTokenTypes::Character);

        m_orAllData |= character;
        m_data.append(character);
    }

    // Appends a run of LChar characters to a Character token.
    // m_orAllData is not updated by this overload.
    void appendToCharacter(const Vector<LChar, 32>& characters)

    {

        ASSERT(m_type == HTMLTokenTypes::Character);

        m_data.appendVector(characters);

    }

    /* Comment Tokens */

    // Read-only access to the text of a Comment token (stored in m_data).
    const DataVector& comment() const

    {

        ASSERT(m_type == HTMLTokenTypes::Comment);

        return m_data;

    }

    // Turns an uninitialized token into a Comment token. No characters are
    // added here; they arrive through appendToComment().
    void beginComment()

    {

        ASSERT(m_type == HTMLTokenTypes::Uninitialized);

        m_type = HTMLTokenTypes::Comment;

    }

    // Appends one non-null character to a Comment token and folds it into
    // the accumulator consulted by isAll8BitData().
    void appendToComment(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == HTMLTokenTypes::Comment);

        m_orAllData |= character;
        m_data.append(character);
    }

    // Discards the text of a Character token while leaving its type alone;
    // the 8-bit tracking accumulator is reset along with the buffer.
    void eraseCharacters()
    {
        ASSERT(m_type == HTMLTokenTypes::Character);

        m_orAllData = 0;
        m_data.clear();
    }

145425private:

    typename HTMLTokenTypes::Type m_type;

    typename Attribute::Range m_range; // Always starts at zero.

    int m_baseOffset;

    DataVector m_data;

    UChar m_orAllData;

    // For StartTag and EndTag

    bool m_selfClosing;

    AttributeList m_attributes;

    // A pointer into m_attributes used during lexing.

    Attribute* m_currentAttribute;

    // For DOCTYPE

    OwnPtr<DoctypeData> m_doctypeData;

};

Source/WebCore/html/parser/HTMLTokenTypes.h

#ifndef HTMLTokenTypes_h

#define HTMLTokenTypes_h

#include "MarkupTokenBase.h"

#include <wtf/Noncopyable.h>

namespace WebCore {

class HTMLTokenTypes {

Source/WebCore/html/parser/XSSAuditor.h

#include "HTMLToken.h"

#include "HTTPParsers.h"

31#include "KURL.h"

#include "SuffixTree.h"

#include "TextEncoding.h"

#include <wtf/PassOwnPtr.h>

Source/WebCore/xml/parser/MarkupTokenBase.h

/*

 * Copyright (C) 2010 Google, Inc. All Rights Reserved.

 * Copyright (C) 2011 Apple Inc. All Rights Reserved.

 *

 * Redistribution and use in source and binary forms, with or without

 * modification, are permitted provided that the following conditions

 * are met:

 * 1. Redistributions of source code must retain the above copyright

 *    notice, this list of conditions and the following disclaimer.

 * 2. Redistributions in binary form must reproduce the above copyright

 *    notice, this list of conditions and the following disclaimer in the

 *    documentation and/or other materials provided with the distribution.

 *

 * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY

 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE

 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR

 * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL APPLE INC. OR

 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,

 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,

 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR

 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY

 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

 */

#ifndef MarkupTokenBase_h

#define MarkupTokenBase_h

#include "ElementAttributeData.h"

#include <wtf/Vector.h>

#ifndef NDEBUG

#include <stdio.h>

#endif

namespace WebCore {

// Looks through |attributes| in order for an entry whose name matches |name|.
// Returns the address of the first such entry, or 0 when there is none.
static inline Attribute* findAttributeInVector(Vector<Attribute>& attributes, const QualifiedName& name)
{
    unsigned position = 0;
    while (position < attributes.size()) {
        Attribute& entry = attributes.at(position);
        if (entry.name().matches(name))
            return &entry;
        ++position;
    }
    return 0;
}

// Token storage parameterised on TypeSet. TypeSet must provide a nested
// TypeSet::Type and the enumerators used below: Uninitialized, StartTag,
// EndTag, Character, Comment and EndOfFile.
//
// One token object is meant to be reused: clear() puts it back into the
// Uninitialized state, one of the begin*/ensure*/make* methods gives it a
// type, and the appendTo* methods then fill in its data.
template<typename TypeSet>
class MarkupTokenBase {
    WTF_MAKE_NONCOPYABLE(MarkupTokenBase);
    WTF_MAKE_FAST_ALLOCATED;
public:
    typedef TypeSet Type;

    // One attribute of a start/end tag as collected during lexing.
    class Attribute {
    public:
        // A pair of integer offsets; the setters below store values of the
        // form (offset - m_baseOffset).
        class Range {
        public:
            int m_start;
            int m_end;
        };

        Range m_nameRange;
        Range m_valueRange;
        WTF::Vector<UChar, 32> m_name;
        WTF::Vector<UChar, 32> m_value;
    };

    typedef WTF::Vector<Attribute, 10> AttributeList;
    typedef WTF::Vector<UChar, 1024> DataVector;

    // Starts in the state produced by (this class's) clear().
    MarkupTokenBase() { clear(); }
    virtual ~MarkupTokenBase() { }

    // Resets type, range, base offset, character data and the 8-bit
    // accumulator. Tag-specific state (m_selfClosing, m_attributes,
    // m_currentAttribute) is reset by beginStartTag()/beginEndTag() instead.
    virtual void clear()
    {
        m_type = TypeSet::Uninitialized;
        m_range.m_start = 0;
        m_range.m_end = 0;
        m_baseOffset = 0;
        m_data.clear();
        m_orAllData = 0;
    }

    // True while no type has been assigned since the last clear().
    // Const-qualified: it only reads m_type, like type() below.
    bool isUninitialized() const { return m_type == TypeSet::Uninitialized; }

    int startIndex() const { return m_range.m_start; }
    int endIndex() const { return m_range.m_end; }

    // Records the offset subtracted from every offset passed to end() and
    // to the attribute range setters.
    void setBaseOffset(int offset)
    {
        m_baseOffset = offset;
    }

    // Stores the end of the token's range relative to the base offset.
    void end(int endOffset)
    {
        m_range.m_end = endOffset - m_baseOffset;
    }

    // Turns a still-uninitialized token into the EndOfFile token.
    void makeEndOfFile()
    {
        ASSERT(m_type == TypeSet::Uninitialized);
        m_type = TypeSet::EndOfFile;
    }

    // Begins a StartTag whose name starts with the non-null |character| and
    // resets all per-tag state.
    void beginStartTag(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == TypeSet::Uninitialized);
        m_type = TypeSet::StartTag;
        m_selfClosing = false;
        m_currentAttribute = 0;
        m_attributes.clear();

        m_data.append(character);
        m_orAllData |= character;
    }

    // Begins an EndTag whose name starts with |character| and resets all
    // per-tag state. m_orAllData is not updated by the LChar overloads.
    void beginEndTag(LChar character)
    {
        ASSERT(m_type == TypeSet::Uninitialized);
        m_type = TypeSet::EndTag;
        m_selfClosing = false;
        m_currentAttribute = 0;
        m_attributes.clear();

        m_data.append(character);
    }

    // As above, but the name starts with the whole of |characters|.
    void beginEndTag(const Vector<LChar, 32>& characters)
    {
        ASSERT(m_type == TypeSet::Uninitialized);
        m_type = TypeSet::EndTag;
        m_selfClosing = false;
        m_currentAttribute = 0;
        m_attributes.clear();

        m_data.appendVector(characters);
    }

    // Starting a character token works slightly differently than starting
    // other types of tokens because we want to save a per-character branch.
    void ensureIsCharacterToken()
    {
        ASSERT(m_type == TypeSet::Uninitialized || m_type == TypeSet::Character);
        m_type = TypeSet::Character;
    }

    // Turns an uninitialized token into a Comment token.
    void beginComment()
    {
        ASSERT(m_type == TypeSet::Uninitialized);
        m_type = TypeSet::Comment;
    }

    // Appends a narrow character to a Character token; m_orAllData is not
    // updated by this overload.
    void appendToCharacter(char character)
    {
        ASSERT(m_type == TypeSet::Character);
        m_data.append(character);
    }

    // Appends a UChar to a Character token and tracks it in m_orAllData.
    void appendToCharacter(UChar character)
    {
        ASSERT(m_type == TypeSet::Character);
        m_data.append(character);
        m_orAllData |= character;
    }

    // Appends a run of LChar characters to a Character token; m_orAllData
    // is not updated by this overload.
    void appendToCharacter(const Vector<LChar, 32>& characters)
    {
        ASSERT(m_type == TypeSet::Character);
        m_data.appendVector(characters);
    }

    // Appends a non-null character to a Comment token and tracks it in
    // m_orAllData.
    void appendToComment(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == TypeSet::Comment);
        m_data.append(character);
        m_orAllData |= character;
    }

    // Adds one attribute slot to the current tag and makes it the target of
    // the attribute name/value calls that follow.
    void addNewAttribute()
    {
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        m_attributes.grow(m_attributes.size() + 1);
        m_currentAttribute = &m_attributes.last();
#ifndef NDEBUG
        // Debug builds zero the ranges so ASSERTs on them start from a
        // known value.
        m_currentAttribute->m_nameRange.m_start = 0;
        m_currentAttribute->m_nameRange.m_end = 0;
        m_currentAttribute->m_valueRange.m_start = 0;
        m_currentAttribute->m_valueRange.m_end = 0;
#endif
    }

    void beginAttributeName(int offset)
    {
        m_currentAttribute->m_nameRange.m_start = offset - m_baseOffset;
    }

    // Ends the name range and initialises the value range to an empty range
    // at the same position.
    void endAttributeName(int offset)
    {
        int index = offset - m_baseOffset;
        m_currentAttribute->m_nameRange.m_end = index;
        m_currentAttribute->m_valueRange.m_start = index;
        m_currentAttribute->m_valueRange.m_end = index;
    }

    void beginAttributeValue(int offset)
    {
        m_currentAttribute->m_valueRange.m_start = offset - m_baseOffset;
#ifndef NDEBUG
        m_currentAttribute->m_valueRange.m_end = 0;
#endif
    }

    void endAttributeValue(int offset)
    {
        m_currentAttribute->m_valueRange.m_end = offset - m_baseOffset;
    }

    // Appends a non-null character to the current attribute's name.
    void appendToAttributeName(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        // FIXME: We should be able to add the following ASSERT once we fix
        // https://bugs.webkit.org/show_bug.cgi?id=62971
        //   ASSERT(m_currentAttribute->m_nameRange.m_start);
        m_currentAttribute->m_name.append(character);
    }

    // Appends a non-null character to the current attribute's value; the
    // value's start offset must already be non-zero.
    void appendToAttributeValue(UChar character)
    {
        ASSERT(character);
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        ASSERT(m_currentAttribute->m_valueRange.m_start);
        m_currentAttribute->m_value.append(character);
    }

    // Appends the whole of the non-empty |value| to the attribute at index |i|.
    void appendToAttributeValue(size_t i, const String& value)
    {
        ASSERT(!value.isEmpty());
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        m_attributes[i].m_value.append(value.characters(), value.length());
    }

    typename Type::Type type() const { return m_type; }

    bool selfClosing() const
    {
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        return m_selfClosing;
    }

    void setSelfClosing()
    {
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        m_selfClosing = true;
    }

    const AttributeList& attributes() const
    {
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        return m_attributes;
    }

    // Discards the text of a Character token and resets the 8-bit accumulator.
    void eraseCharacters()
    {
        ASSERT(m_type == TypeSet::Character);
        m_data.clear();
        m_orAllData = 0;
    }

    // Empties the value of the attribute at index |i|; its name is kept.
    void eraseValueOfAttribute(size_t i)
    {
        ASSERT(m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        m_attributes[i].m_value.clear();
    }

    const DataVector& characters() const
    {
        ASSERT(m_type == TypeSet::Character);
        return m_data;
    }

    const DataVector& comment() const
    {
        ASSERT(m_type == TypeSet::Comment);
        return m_data;
    }

    const DataVector& data() const
    {
        ASSERT(m_type == TypeSet::Character || m_type == TypeSet::Comment || m_type == TypeSet::StartTag || m_type == TypeSet::EndTag);
        return m_data;
    }

    // True when the OR of the tracked characters fits in the low byte.
    bool isAll8BitData() const
    {
        return (m_orAllData <= 0xff);
    }

    // The name shares storage with the other character data (m_data).
    const DataVector& name() const
    {
        return m_data;
    }

    // Builds a String copy of m_data: emptyString() for an empty buffer,
    // String::make8BitFrom16BitSource when isAll8BitData(), otherwise a
    // String constructed directly from the UChar buffer.
    String nameString() const
    {
        if (!m_data.size())
            return emptyString();
        if (isAll8BitData())
            return String::make8BitFrom16BitSource(m_data.data(), m_data.size());
        return String(m_data.data(), m_data.size());
    }

protected:

#ifndef NDEBUG
    // Debug-only helper: writes every character of |string| to stderr.
    void printString(const DataVector& string) const
    {
        DataVector::const_iterator iter = string.begin();
        for (; iter != string.end(); ++iter)
            fprintf(stderr, "%lc", wchar_t(*iter));
    }
#endif // NDEBUG

    // Appends a non-null character to m_data and tracks it in m_orAllData.
    // No type check is performed here.
    void appendToName(UChar character)
    {
        ASSERT(character);
        m_data.append(character);
        m_orAllData |= character;
    }

    typename Type::Type m_type;
    typename Attribute::Range m_range; // Always starts at zero.
    int m_baseOffset;
    DataVector m_data;
    UChar m_orAllData;

    // For StartTag and EndTag
    bool m_selfClosing;
    AttributeList m_attributes;

    // A pointer into m_attributes used during lexing.
    Attribute* m_currentAttribute;
};

}

#endif // MarkupTokenBase_h