1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
|
/*
* Copyright (C) 2010 Google, Inc. All Rights Reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY GOOGLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL GOOGLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "config.h"
#include "HTML5TreeBuilder.h"
#include "Attribute.h"
#include "HTML5Lexer.h"
#include "HTML5Token.h"
#include "HTMLDocument.h"
#include "HTMLParser.h"
#include "HTMLTokenizer.h"
#include "NotImplemented.h"
namespace WebCore {
// Builds a tree builder bound to |lexer| and |document|.
//
// The document, the error-reporting flag and the lexer are stored as given.
// A legacy HTMLParser is also created here, with the same |document| and
// |reportErrors|; passTokenToLegacyParser() and finished() forward to it.
HTML5TreeBuilder::HTML5TreeBuilder(HTML5Lexer* lexer, HTMLDocument* document, bool reportErrors)
    : m_document(document)
    , m_reportErrors(reportErrors)
    , m_lexer(lexer)
    , m_legacyHTMLParser(new HTMLParser(document, reportErrors))
{
}
// Destructor; performs no explicit work.
// NOTE(review): m_legacyHTMLParser is allocated with `new` in the constructor.
// Presumably the member is an owning smart pointer that frees it; confirm in
// HTML5TreeBuilder.h, otherwise the legacy parser is leaked here.
HTML5TreeBuilder::~HTML5TreeBuilder()
{
}
// Translates an HTML5Token into the legacy parser's Token representation.
//
// |oldStyleToken| is filled in according to |token|'s type:
//   - Character:       tagName = textAtom,    text = token.characters()
//   - Comment:         tagName = commentAtom, text = token.data()
//   - StartTag/EndTag: beginTag, selfClosingTag and tagName are set, and every
//                      attribute with a non-empty name is inserted into attrs
//                      (attrs is created the first time it is needed).
// Uninitialized, DOCTYPE and EndOfFile tokens are not expected here and assert.
static void convertToOldStyle(HTML5Token& token, Token& oldStyleToken)
{
    switch (token.type()) {
    case HTML5Token::Character:
        oldStyleToken.tagName = textAtom;
        oldStyleToken.text = token.characters().impl();
        break;

    case HTML5Token::Comment:
        oldStyleToken.tagName = commentAtom;
        oldStyleToken.text = token.data().impl();
        break;

    case HTML5Token::StartTag:
    case HTML5Token::EndTag: {
        oldStyleToken.beginTag = (token.type() == HTML5Token::StartTag);
        oldStyleToken.selfClosingTag = token.selfClosing();
        oldStyleToken.tagName = token.name();

        HTML5Token::AttributeList& sourceAttributes = token.attributes();
        for (HTML5Token::AttributeList::iterator attribute = sourceAttributes.begin();
             attribute != sourceAttributes.end(); ++attribute) {
            // Attributes without a name are not carried over.
            if (attribute->m_name.isEmpty())
                continue;

            // NOTE(review): StringImpl::adopt() presumably takes over the
            // attribute's name/value buffers, leaving them consumed in
            // |token| -- confirm against StringImpl.
            String attributeName(StringImpl::adopt(attribute->m_name));
            String attributeValue(StringImpl::adopt(attribute->m_value));
            RefPtr<Attribute> legacyAttribute = Attribute::createMapped(attributeName, attributeValue);

            // The attribute map is only allocated once there is something to store.
            if (!oldStyleToken.attrs)
                oldStyleToken.attrs = NamedNodeMap::create();
            oldStyleToken.attrs->insertAttribute(legacyAttribute.release(), false);
        }
        break;
    }

    case HTML5Token::DOCTYPE:
    case HTML5Token::EndOfFile:
        // No translation exists for these token types yet.
        ASSERT_NOT_REACHED();
        notImplemented();
        break;

    case HTML5Token::Uninitialized:
        ASSERT_NOT_REACHED();
        break;
    }
}
// Hands |token| to the legacy HTMLParser and returns the result of its
// parseToken() call.
//
// The token is first converted to an old-style Token via convertToOldStyle().
// If |token| is a "script" start tag, the lexer is switched to
// ScriptDataState before the token is forwarded.
PassRefPtr<Node> HTML5TreeBuilder::passTokenToLegacyParser(HTML5Token& token)
{
    // Switching the lexer state is supposed to be done by the parser, but
    // when using the old parser we have to do this manually.
    const bool isScriptStartTag = token.type() == HTML5Token::StartTag && token.name() == "script";
    if (isScriptStartTag)
        m_lexer->setState(HTML5Lexer::ScriptDataState);

    // For now, we translate into an old-style token for testing.
    Token legacyToken;
    convertToOldStyle(token, legacyToken);
    return m_legacyHTMLParser->parseToken(&legacyToken);
}
// Entry point for feeding one token into the tree builder.
//
// Currently this only delegates to passTokenToLegacyParser() and returns
// its result.
PassRefPtr<Node> HTML5TreeBuilder::constructTreeFromToken(HTML5Token& token)
{
    // Our HTML5 parser implementation will go here in a separate patch.
    // Until then, every token is routed through the legacy parser.
    return passTokenToLegacyParser(token);
}
// Forwards the finished() notification to the legacy HTMLParser.
// No other state of the tree builder is touched here.
void HTML5TreeBuilder::finished()
{
    m_legacyHTMLParser->finished();
}
}
|