summaryrefslogtreecommitdiffstats
path: root/WebCore/html/LegacyPreloadScanner.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'WebCore/html/LegacyPreloadScanner.cpp')
-rw-r--r--WebCore/html/LegacyPreloadScanner.cpp856
1 files changed, 856 insertions, 0 deletions
diff --git a/WebCore/html/LegacyPreloadScanner.cpp b/WebCore/html/LegacyPreloadScanner.cpp
new file mode 100644
index 0000000..c9fda4f
--- /dev/null
+++ b/WebCore/html/LegacyPreloadScanner.cpp
@@ -0,0 +1,856 @@
+/*
+ * Copyright (C) 2008 Apple Inc. All Rights Reserved.
+ * Copyright (C) 2009 Torch Mobile, Inc. http://www.torchmobile.com/
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ * 1. Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * 2. Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ *
+ * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
+ * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
+ * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+ * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
+ * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+ * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+ * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+ * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
+ * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
+ * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
+ */
+
+#include "config.h"
+#include "LegacyPreloadScanner.h"
+
+#include "AtomicString.h"
+#include "CachedCSSStyleSheet.h"
+#include "CachedImage.h"
+#include "CachedResource.h"
+#include "CachedResourceClient.h"
+#include "CachedScript.h"
+#include "CSSHelper.h"
+#include "DocLoader.h"
+#include "Document.h"
+#include "Frame.h"
+#include "FrameLoader.h"
+#include "HTMLLinkElement.h"
+#include "HTMLNames.h"
+#include <wtf/text/CString.h>
+#include <wtf/CurrentTime.h>
+#include <wtf/unicode/Unicode.h>
+
+// Use __GNUC__ instead of PLATFORM(GCC) to stay consistent with the gperf generated c file
+#ifdef __GNUC__
+// The main tokenizer includes this too so we are getting two copies of the data. However, this way the code gets inlined.
+#include "HTMLEntityNames.cpp"
+#else
+// Not inlined for non-GCC compilers
+struct Entity {
+ const char* name;
+ int code;
+};
+const struct Entity* findEntity(register const char* str, register unsigned int len);
+#endif
+
+#define PRELOAD_DEBUG 0
+
+using namespace WTF;
+
+namespace WebCore {
+
+using namespace HTMLNames;
+
+LegacyPreloadScanner::LegacyPreloadScanner(Document* doc)
+ : m_inProgress(false)
+ , m_timeUsed(0)
+ , m_bodySeen(false)
+ , m_document(doc)
+{
+#if PRELOAD_DEBUG
+ printf("CREATING PRELOAD SCANNER FOR %s\n", m_document->url().string().latin1().data());
+#endif
+}
+
+LegacyPreloadScanner::~LegacyPreloadScanner()
+{
+#if PRELOAD_DEBUG
+ printf("DELETING PRELOAD SCANNER FOR %s\n", m_document->url().string().latin1().data());
+ printf("TOTAL TIME USED %.4fs\n", m_timeUsed);
+#endif
+}
+
+void LegacyPreloadScanner::begin()
+{
+ ASSERT(!m_inProgress);
+ reset();
+ m_inProgress = true;
+}
+
+void LegacyPreloadScanner::end()
+{
+ ASSERT(m_inProgress);
+ m_inProgress = false;
+}
+
+void LegacyPreloadScanner::reset()
+{
+ m_source.clear();
+
+ m_state = Data;
+ m_escape = false;
+ m_contentModel = PCDATA;
+ m_commentPos = 0;
+
+ m_closeTag = false;
+ m_tagName.clear();
+ m_attributeName.clear();
+ m_attributeValue.clear();
+ m_lastStartTag = AtomicString();
+
+ m_urlToLoad = String();
+ m_charset = String();
+ m_linkIsStyleSheet = false;
+ m_lastCharacterIndex = 0;
+ clearLastCharacters();
+
+ m_cssState = CSSInitial;
+ m_cssRule.clear();
+ m_cssRuleValue.clear();
+}
+
+bool LegacyPreloadScanner::scanningBody() const
+{
+ return m_document->body() || m_bodySeen;
+}
+
+void LegacyPreloadScanner::write(const SegmentedString& source)
+{
+#if PRELOAD_DEBUG
+ double startTime = currentTime();
+#endif
+ tokenize(source);
+#if PRELOAD_DEBUG
+ m_timeUsed += currentTime() - startTime;
+#endif
+}
+
+static inline bool isWhitespace(UChar c)
+{
+ return c == ' ' || c == '\n' || c == '\r' || c == '\t';
+}
+
+inline void LegacyPreloadScanner::clearLastCharacters()
+{
+ memset(m_lastCharacters, 0, lastCharactersBufferSize * sizeof(UChar));
+}
+
+inline void LegacyPreloadScanner::rememberCharacter(UChar c)
+{
+ m_lastCharacterIndex = (m_lastCharacterIndex + 1) % lastCharactersBufferSize;
+ m_lastCharacters[m_lastCharacterIndex] = c;
+}
+
+inline bool LegacyPreloadScanner::lastCharactersMatch(const char* chars, unsigned count) const
+{
+ unsigned pos = m_lastCharacterIndex;
+ while (count) {
+ if (chars[count - 1] != m_lastCharacters[pos])
+ return false;
+ --count;
+ if (!pos)
+ pos = lastCharactersBufferSize;
+ --pos;
+ }
+ return true;
+}
+
+static inline unsigned legalEntityFor(unsigned value)
+{
+ // FIXME There is a table for more exceptions in the HTML5 specification.
+ if (value == 0 || value > 0x10FFFF || (value >= 0xD800 && value <= 0xDFFF))
+ return 0xFFFD;
+ return value;
+}
+
+unsigned LegacyPreloadScanner::consumeEntity(SegmentedString& source, bool& notEnoughCharacters)
+{
+ enum EntityState {
+ Initial,
+ NumberType,
+ MaybeHex,
+ Hex,
+ Decimal,
+ Named
+ };
+ EntityState entityState = Initial;
+ unsigned result = 0;
+ Vector<UChar, 10> seenChars;
+ Vector<char, 10> entityName;
+
+ while (!source.isEmpty()) {
+ UChar cc = *source;
+ seenChars.append(cc);
+ switch (entityState) {
+ case Initial:
+ if (isWhitespace(cc) || cc == '<' || cc == '&')
+ return 0;
+ else if (cc == '#')
+ entityState = NumberType;
+ else if ((cc >= 'a' && cc <= 'z') || (cc >= 'A' && cc <= 'Z')) {
+ entityName.append(cc);
+ entityState = Named;
+ } else
+ return 0;
+ break;
+ case NumberType:
+ if (cc == 'x' || cc == 'X')
+ entityState = MaybeHex;
+ else if (cc >= '0' && cc <= '9') {
+ entityState = Decimal;
+ result = cc - '0';
+ } else {
+ source.push('#');
+ return 0;
+ }
+ break;
+ case MaybeHex:
+ if (cc >= '0' && cc <= '9')
+ result = cc - '0';
+ else if (cc >= 'a' && cc <= 'f')
+ result = 10 + cc - 'a';
+ else if (cc >= 'A' && cc <= 'F')
+ result = 10 + cc - 'A';
+ else {
+ source.push('#');
+ source.push(seenChars[1]);
+ return 0;
+ }
+ entityState = Hex;
+ break;
+ case Hex:
+ if (cc >= '0' && cc <= '9')
+ result = result * 16 + cc - '0';
+ else if (cc >= 'a' && cc <= 'f')
+ result = result * 16 + 10 + cc - 'a';
+ else if (cc >= 'A' && cc <= 'F')
+ result = result * 16 + 10 + cc - 'A';
+ else if (cc == ';') {
+ source.advance();
+ return legalEntityFor(result);
+ } else
+ return legalEntityFor(result);
+ break;
+ case Decimal:
+ if (cc >= '0' && cc <= '9')
+ result = result * 10 + cc - '0';
+ else if (cc == ';') {
+ source.advance();
+ return legalEntityFor(result);
+ } else
+ return legalEntityFor(result);
+ break;
+ case Named:
+ // This is the attribute only version, generic version matches somewhat differently
+ while (entityName.size() <= 8) {
+ if (cc == ';') {
+ const Entity* entity = findEntity(entityName.data(), entityName.size());
+ if (entity) {
+ source.advance();
+ return entity->code;
+ }
+ break;
+ }
+ if (!(cc >= 'a' && cc <= 'z') && !(cc >= 'A' && cc <= 'Z') && !(cc >= '0' && cc <= '9')) {
+ const Entity* entity = findEntity(entityName.data(), entityName.size());
+ if (entity)
+ return entity->code;
+ break;
+ }
+ entityName.append(cc);
+ source.advance();
+ if (source.isEmpty())
+ goto outOfCharacters;
+ cc = *source;
+ seenChars.append(cc);
+ }
+ if (seenChars.size() == 2)
+ source.push(seenChars[0]);
+ else if (seenChars.size() == 3) {
+ source.push(seenChars[0]);
+ source.push(seenChars[1]);
+ } else
+ source.prepend(SegmentedString(String(seenChars.data(), seenChars.size() - 1)));
+ return 0;
+ }
+ source.advance();
+ }
+outOfCharacters:
+ notEnoughCharacters = true;
+ source.prepend(SegmentedString(String(seenChars.data(), seenChars.size())));
+ return 0;
+}
+
+void LegacyPreloadScanner::tokenize(const SegmentedString& source)
+{
+ ASSERT(m_inProgress);
+
+ m_source.append(source);
+
+ // This is a simplified HTML5 Tokenizer
+ // http://www.whatwg.org/specs/web-apps/current-work/#tokenisation0
+ while (!m_source.isEmpty()) {
+ UChar cc = *m_source;
+ switch (m_state) {
+ case Data:
+ while (1) {
+ rememberCharacter(cc);
+ if (cc == '&') {
+ if (m_contentModel == PCDATA || m_contentModel == RCDATA) {
+ m_state = EntityData;
+ break;
+ }
+ } else if (cc == '-') {
+ if ((m_contentModel == RCDATA || m_contentModel == CDATA) && !m_escape) {
+ if (lastCharactersMatch("<!--", 4))
+ m_escape = true;
+ }
+ } else if (cc == '<') {
+ if (m_contentModel == PCDATA || ((m_contentModel == RCDATA || m_contentModel == CDATA) && !m_escape)) {
+ m_state = TagOpen;
+ break;
+ }
+ } else if (cc == '>') {
+ if ((m_contentModel == RCDATA || m_contentModel == CDATA) && m_escape) {
+ if (lastCharactersMatch("-->", 3))
+ m_escape = false;
+ }
+ }
+ emitCharacter(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case EntityData:
+ // should try to consume the entity but we only care about entities in attributes
+ m_state = Data;
+ break;
+ case TagOpen:
+ if (m_contentModel == RCDATA || m_contentModel == CDATA) {
+ if (cc == '/')
+ m_state = CloseTagOpen;
+ else {
+ m_state = Data;
+ continue;
+ }
+ } else if (m_contentModel == PCDATA) {
+ if (cc == '!')
+ m_state = MarkupDeclarationOpen;
+ else if (cc == '/')
+ m_state = CloseTagOpen;
+ else if (cc >= 'A' && cc <= 'Z') {
+ m_tagName.clear();
+ m_charset = String();
+ m_tagName.append(cc + 0x20);
+ m_closeTag = false;
+ m_state = TagName;
+ } else if (cc >= 'a' && cc <= 'z') {
+ m_tagName.clear();
+ m_charset = String();
+ m_tagName.append(cc);
+ m_closeTag = false;
+ m_state = TagName;
+ } else if (cc == '>') {
+ m_state = Data;
+ } else if (cc == '?') {
+ m_state = BogusComment;
+ } else {
+ m_state = Data;
+ continue;
+ }
+ }
+ break;
+ case CloseTagOpen:
+ if (m_contentModel == RCDATA || m_contentModel == CDATA) {
+ if (!m_lastStartTag.length()) {
+ m_state = Data;
+ continue;
+ }
+ if (m_source.length() < m_lastStartTag.length() + 1)
+ return;
+ Vector<UChar> tmpString;
+ UChar tmpChar = 0;
+ bool match = true;
+ for (unsigned n = 0; n < m_lastStartTag.length() + 1; n++) {
+ tmpChar = Unicode::toLower(*m_source);
+ if (n < m_lastStartTag.length() && tmpChar != m_lastStartTag[n])
+ match = false;
+ tmpString.append(tmpChar);
+ m_source.advance();
+ }
+ m_source.prepend(SegmentedString(String(tmpString.data(), tmpString.size())));
+ if (!match || (!isWhitespace(tmpChar) && tmpChar != '>' && tmpChar != '/')) {
+ m_state = Data;
+ continue;
+ }
+ }
+ if (cc >= 'A' && cc <= 'Z') {
+ m_tagName.clear();
+ m_charset = String();
+ m_tagName.append(cc + 0x20);
+ m_closeTag = true;
+ m_state = TagName;
+ } else if (cc >= 'a' && cc <= 'z') {
+ m_tagName.clear();
+ m_charset = String();
+ m_tagName.append(cc);
+ m_closeTag = true;
+ m_state = TagName;
+ } else if (cc == '>') {
+ m_state = Data;
+ } else
+ m_state = BogusComment;
+ break;
+ case TagName:
+ while (1) {
+ if (isWhitespace(cc)) {
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc == '>') {
+ emitTag();
+ m_state = Data;
+ break;
+ }
+ if (cc == '/') {
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc >= 'A' && cc <= 'Z')
+ m_tagName.append(cc + 0x20);
+ else
+ m_tagName.append(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case BeforeAttributeName:
+ if (isWhitespace(cc))
+ ;
+ else if (cc == '>') {
+ emitTag();
+ m_state = Data;
+ } else if (cc >= 'A' && cc <= 'Z') {
+ m_attributeName.clear();
+ m_attributeValue.clear();
+ m_attributeName.append(cc + 0x20);
+ m_state = AttributeName;
+ } else if (cc == '/')
+ ;
+ else {
+ m_attributeName.clear();
+ m_attributeValue.clear();
+ m_attributeName.append(cc);
+ m_state = AttributeName;
+ }
+ break;
+ case AttributeName:
+ while (1) {
+ if (isWhitespace(cc)) {
+ m_state = AfterAttributeName;
+ break;
+ }
+ if (cc == '=') {
+ m_state = BeforeAttributeValue;
+ break;
+ }
+ if (cc == '>') {
+ emitTag();
+ m_state = Data;
+ break;
+ }
+ if (cc == '/') {
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc >= 'A' && cc <= 'Z')
+ m_attributeName.append(cc + 0x20);
+ else
+ m_attributeName.append(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case AfterAttributeName:
+ if (isWhitespace(cc))
+ ;
+ else if (cc == '=')
+ m_state = BeforeAttributeValue;
+ else if (cc == '>') {
+ emitTag();
+ m_state = Data;
+ } else if (cc >= 'A' && cc <= 'Z') {
+ m_attributeName.clear();
+ m_attributeValue.clear();
+ m_attributeName.append(cc + 0x20);
+ m_state = AttributeName;
+ } else if (cc == '/')
+ m_state = BeforeAttributeName;
+ else {
+ m_attributeName.clear();
+ m_attributeValue.clear();
+ m_attributeName.append(cc);
+ m_state = AttributeName;
+ }
+ break;
+ case BeforeAttributeValue:
+ if (isWhitespace(cc))
+ ;
+ else if (cc == '"')
+ m_state = AttributeValueDoubleQuoted;
+ else if (cc == '&') {
+ m_state = AttributeValueUnquoted;
+ continue;
+ } else if (cc == '\'')
+ m_state = AttributeValueSingleQuoted;
+ else if (cc == '>') {
+ emitTag();
+ m_state = Data;
+ } else {
+ m_attributeValue.append(cc);
+ m_state = AttributeValueUnquoted;
+ }
+ break;
+ case AttributeValueDoubleQuoted:
+ while (1) {
+ if (cc == '"') {
+ processAttribute();
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc == '&') {
+ m_stateBeforeEntityInAttributeValue = m_state;
+ m_state = EntityInAttributeValue;
+ break;
+ }
+ m_attributeValue.append(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case AttributeValueSingleQuoted:
+ while (1) {
+ if (cc == '\'') {
+ processAttribute();
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc == '&') {
+ m_stateBeforeEntityInAttributeValue = m_state;
+ m_state = EntityInAttributeValue;
+ break;
+ }
+ m_attributeValue.append(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case AttributeValueUnquoted:
+ while (1) {
+ if (isWhitespace(cc)) {
+ processAttribute();
+ m_state = BeforeAttributeName;
+ break;
+ }
+ if (cc == '&') {
+ m_stateBeforeEntityInAttributeValue = m_state;
+ m_state = EntityInAttributeValue;
+ break;
+ }
+ if (cc == '>') {
+ processAttribute();
+ emitTag();
+ m_state = Data;
+ break;
+ }
+ m_attributeValue.append(cc);
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case EntityInAttributeValue:
+ {
+ bool notEnoughCharacters = false;
+ unsigned entity = consumeEntity(m_source, notEnoughCharacters);
+ if (notEnoughCharacters)
+ return;
+ if (entity > 0xFFFF) {
+ m_attributeValue.append(U16_LEAD(entity));
+ m_attributeValue.append(U16_TRAIL(entity));
+ } else if (entity)
+ m_attributeValue.append(entity);
+ else
+ m_attributeValue.append('&');
+ }
+ m_state = m_stateBeforeEntityInAttributeValue;
+ continue;
+ case BogusComment:
+ while (1) {
+ if (cc == '>') {
+ m_state = Data;
+ break;
+ }
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case MarkupDeclarationOpen: {
+ if (cc == '-') {
+ if (m_source.length() < 2)
+ return;
+ m_source.advance();
+ cc = *m_source;
+ if (cc == '-')
+ m_state = CommentStart;
+ else {
+ m_state = BogusComment;
+ continue;
+ }
+ // If we cared about the DOCTYPE we would test to enter those states here
+ } else {
+ m_state = BogusComment;
+ continue;
+ }
+ break;
+ }
+ case CommentStart:
+ if (cc == '-')
+ m_state = CommentStartDash;
+ else if (cc == '>')
+ m_state = Data;
+ else
+ m_state = Comment;
+ break;
+ case CommentStartDash:
+ if (cc == '-')
+ m_state = CommentEnd;
+ else if (cc == '>')
+ m_state = Data;
+ else
+ m_state = Comment;
+ break;
+ case Comment:
+ while (1) {
+ if (cc == '-') {
+ m_state = CommentEndDash;
+ break;
+ }
+ m_source.advance();
+ if (m_source.isEmpty())
+ return;
+ cc = *m_source;
+ }
+ break;
+ case CommentEndDash:
+ if (cc == '-')
+ m_state = CommentEnd;
+ else
+ m_state = Comment;
+ break;
+ case CommentEnd:
+ if (cc == '>')
+ m_state = Data;
+ else if (cc == '-')
+ ;
+ else
+ m_state = Comment;
+ break;
+ }
+ m_source.advance();
+ }
+}
+
+void LegacyPreloadScanner::processAttribute()
+{
+ AtomicString tag = AtomicString(m_tagName.data(), m_tagName.size());
+ AtomicString attribute = AtomicString(m_attributeName.data(), m_attributeName.size());
+
+ String value(m_attributeValue.data(), m_attributeValue.size());
+ if (tag == scriptTag || tag == imgTag) {
+ if (attribute == srcAttr && m_urlToLoad.isEmpty())
+ m_urlToLoad = deprecatedParseURL(value);
+ else if (attribute == charsetAttr)
+ m_charset = value;
+ } else if (tag == linkTag) {
+ if (attribute == hrefAttr && m_urlToLoad.isEmpty())
+ m_urlToLoad = deprecatedParseURL(value);
+ else if (attribute == relAttr) {
+ HTMLLinkElement::RelAttribute rel;
+ HTMLLinkElement::tokenizeRelAttribute(value, rel);
+ m_linkIsStyleSheet = rel.m_isStyleSheet && !rel.m_isAlternate && !rel.m_isIcon && !rel.m_isDNSPrefetch;
+ } else if (attribute == charsetAttr)
+ m_charset = value;
+ }
+}
+
+inline void LegacyPreloadScanner::emitCharacter(UChar c)
+{
+ if (m_contentModel == CDATA && m_lastStartTag == styleTag)
+ tokenizeCSS(c);
+}
+
+inline void LegacyPreloadScanner::tokenizeCSS(UChar c)
+{
+ // We are just interested in @import rules, no need for real tokenization here
+ // Searching for other types of resources is probably low payoff
+ switch (m_cssState) {
+ case CSSInitial:
+ if (c == '@')
+ m_cssState = CSSRuleStart;
+ else if (c == '/')
+ m_cssState = CSSMaybeComment;
+ break;
+ case CSSMaybeComment:
+ if (c == '*')
+ m_cssState = CSSComment;
+ else
+ m_cssState = CSSInitial;
+ break;
+ case CSSComment:
+ if (c == '*')
+ m_cssState = CSSMaybeCommentEnd;
+ break;
+ case CSSMaybeCommentEnd:
+ if (c == '/')
+ m_cssState = CSSInitial;
+ else if (c == '*')
+ ;
+ else
+ m_cssState = CSSComment;
+ break;
+ case CSSRuleStart:
+ if ((c >= 'A' && c <= 'Z') || (c >= 'a' && c <= 'z')) {
+ m_cssRule.clear();
+ m_cssRuleValue.clear();
+ m_cssRule.append(c);
+ m_cssState = CSSRule;
+ } else
+ m_cssState = CSSInitial;
+ break;
+ case CSSRule:
+ if (isWhitespace(c))
+ m_cssState = CSSAfterRule;
+ else if (c == ';')
+ m_cssState = CSSInitial;
+ else
+ m_cssRule.append(c);
+ break;
+ case CSSAfterRule:
+ if (isWhitespace(c))
+ ;
+ else if (c == ';')
+ m_cssState = CSSInitial;
+ else {
+ m_cssState = CSSRuleValue;
+ m_cssRuleValue.append(c);
+ }
+ break;
+ case CSSRuleValue:
+ if (isWhitespace(c))
+ m_cssState = CSSAfterRuleValue;
+ else if (c == ';') {
+ emitCSSRule();
+ m_cssState = CSSInitial;
+ } else
+ m_cssRuleValue.append(c);
+ break;
+ case CSSAfterRuleValue:
+ if (isWhitespace(c))
+ ;
+ else if (c == ';') {
+ emitCSSRule();
+ m_cssState = CSSInitial;
+ } else {
+ // FIXME media rules
+ m_cssState = CSSInitial;
+ }
+ break;
+ }
+}
+
+void LegacyPreloadScanner::emitTag()
+{
+ if (m_closeTag) {
+ m_contentModel = PCDATA;
+ m_cssState = CSSInitial;
+ clearLastCharacters();
+ return;
+ }
+
+ AtomicString tag(m_tagName.data(), m_tagName.size());
+ m_lastStartTag = tag;
+
+ if (tag == textareaTag || tag == titleTag)
+ m_contentModel = RCDATA;
+ else if (tag == styleTag || tag == xmpTag || tag == scriptTag || tag == iframeTag || tag == noembedTag || tag == noframesTag)
+ m_contentModel = CDATA;
+ else if (tag == noscriptTag)
+ // we wouldn't be here if scripts were disabled
+ m_contentModel = CDATA;
+ else if (tag == plaintextTag)
+ m_contentModel = PLAINTEXT;
+ else
+ m_contentModel = PCDATA;
+
+ if (tag == bodyTag)
+ m_bodySeen = true;
+
+ if (m_urlToLoad.isEmpty()) {
+ m_linkIsStyleSheet = false;
+ return;
+ }
+
+ if (tag == scriptTag)
+ m_document->docLoader()->preload(CachedResource::Script, m_urlToLoad, m_charset, scanningBody());
+ else if (tag == imgTag)
+ m_document->docLoader()->preload(CachedResource::ImageResource, m_urlToLoad, String(), scanningBody());
+ else if (tag == linkTag && m_linkIsStyleSheet)
+ m_document->docLoader()->preload(CachedResource::CSSStyleSheet, m_urlToLoad, m_charset, scanningBody());
+
+ m_urlToLoad = String();
+ m_charset = String();
+ m_linkIsStyleSheet = false;
+}
+
+void LegacyPreloadScanner::emitCSSRule()
+{
+ String rule(m_cssRule.data(), m_cssRule.size());
+ if (equalIgnoringCase(rule, "import") && !m_cssRuleValue.isEmpty()) {
+ String value(m_cssRuleValue.data(), m_cssRuleValue.size());
+ String url = deprecatedParseURL(value);
+ if (!url.isEmpty())
+ m_document->docLoader()->preload(CachedResource::CSSStyleSheet, url, String(), scanningBody());
+ }
+ m_cssRule.clear();
+ m_cssRuleValue.clear();
+}
+
+}