/* * Copyright (C) 2000 Peter Kelly (pmk@post.com) * Copyright (C) 2005, 2006, 2007 Apple Inc. All rights reserved. * Copyright (C) 2007 Samuel Weinig (sam@webkit.org) * Copyright (C) 2008 Nokia Corporation and/or its subsidiary(-ies) * Copyright (C) 2008, 2009 Torch Mobile Inc. All rights reserved. (http://www.torchmobile.com/) * * This library is free software; you can redistribute it and/or * modify it under the terms of the GNU Library General Public * License as published by the Free Software Foundation; either * version 2 of the License, or (at your option) any later version. * * This library is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * Library General Public License for more details. * * You should have received a copy of the GNU Library General Public License * along with this library; see the file COPYING.LIB. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301, USA. * */ #ifndef XMLTokenizer_h #define XMLTokenizer_h #if USE(EXPAT) #include "CachedResourceClient.h" #include "SegmentedString.h" #include "StringHash.h" #include "Tokenizer.h" #include #include #include namespace WebCore { class Node; class CachedScript; class DocumentFragment; class Document; class Element; class FrameView; class PendingCallbacks; class XMLTokenizer : public Tokenizer, public CachedResourceClient { public: XMLTokenizer(Document *, FrameView * = 0); XMLTokenizer(DocumentFragment *, Element *); ~XMLTokenizer(); enum ErrorType { warning, nonFatal, fatal }; // from Tokenizer virtual bool write(const SegmentedString &str, bool); virtual void finish(); virtual bool isWaitingForScripts() const; virtual void stopParsing(); virtual bool wellFormed() const { return !m_sawError; } virtual int lineNumber() const; virtual int columnNumber() const; // from CachedObjectClient virtual void notifyFinished(CachedResource *finishedObj); // callbacks from parser expat void startElementNs(const XML_Char *name, const XML_Char **atts); void endElementNs(); void characters(const XML_Char *s, int len); void processingInstruction(const XML_Char *target, const XML_Char *data); void comment(const XML_Char *s); void startCdata(); void endCdata(); void error(ErrorType type, const char* m, int lineNumber, int columnNumber); // utilities XML_Parser getXMLParser() const { return m_parser; } void setXMLParser(XML_Parser parser) { m_parser = parser; } private: void setCurrentNode(Node*); void end(); void pauseParsing(); void resumeParsing(); void reportError(); void insertErrorMessageBlock(); bool enterText(); void exitText(); Document *m_doc; FrameView *m_view; XML_Parser m_parser; Node *m_currentNode; bool m_currentNodeIsReferenced; bool m_sawError; bool m_sawXSLTransform; bool m_sawFirstElement; bool m_parserPaused; bool m_requestingScript; bool m_finishCalled; int m_errorCount; String m_errorMessages; CachedScript *m_pendingScript; RefPtr m_scriptElement; int m_scriptStartLine; bool m_parsingFragment; String m_defaultNamespaceURI; typedef HashMap PrefixForNamespaceMap; PrefixForNamespaceMap m_prefixToNamespaceMap; OwnPtr m_pendingCallbacks; SegmentedString m_pendingSrc; }; HashMap parseAttributes(const String&, bool& attrsOK); bool parseXMLDocumentFragment(const String&, DocumentFragment*, Element* parent = 0); } // namespace WebCore #else // USE(EXPAT) #include "CachedResourceClient.h" #include "CachedResourceHandle.h" #include "SegmentedString.h" #include "StringHash.h" #include "Tokenizer.h" #include #include #if USE(QXMLSTREAM) #include #else #include #include #endif namespace WebCore { class Node; class CachedScript; class DocLoader; class DocumentFragment; class Document; class Element; class FrameView; class PendingCallbacks; class ScriptElement; class XMLTokenizer : public Tokenizer, public CachedResourceClient { public: XMLTokenizer(Document*, FrameView* = 0); XMLTokenizer(DocumentFragment*, Element*); ~XMLTokenizer(); enum ErrorType { warning, nonFatal, fatal }; // from Tokenizer virtual void write(const SegmentedString&, bool appendData); virtual void finish(); virtual bool isWaitingForScripts() const; virtual void stopParsing(); void end(); void pauseParsing(); void resumeParsing(); void setIsXHTMLDocument(bool isXHTML) { m_isXHTMLDocument = isXHTML; } bool isXHTMLDocument() const { return m_isXHTMLDocument; } #if ENABLE(XHTMLMP) void setIsXHTMLMPDocument(bool isXHTML) { m_isXHTMLMPDocument = isXHTML; } bool isXHTMLMPDocument() const { return m_isXHTMLMPDocument; } #endif #if ENABLE(WML) bool isWMLDocument() const; #endif // from CachedResourceClient virtual void notifyFinished(CachedResource* finishedObj); void handleError(ErrorType type, const char* m, int lineNumber, int columnNumber); virtual bool wellFormed() const { return !m_sawError; } int lineNumber() const; int columnNumber() const; #if USE(QXMLSTREAM) private: void parse(); void startDocument(); void parseStartElement(); void parseEndElement(); void parseCharacters(); void parseProcessingInstruction(); void parseCdata(); void parseComment(); void endDocument(); void parseDtd(); bool hasError() const; #else public: // callbacks from parser SAX void error(ErrorType, const char* message, va_list args) WTF_ATTRIBUTE_PRINTF(3, 0); void startElementNs(const xmlChar* xmlLocalName, const xmlChar* xmlPrefix, const xmlChar* xmlURI, int nb_namespaces, const xmlChar** namespaces, int nb_attributes, int nb_defaulted, const xmlChar** libxmlAttributes); void endElementNs(); void characters(const xmlChar* s, int len); void processingInstruction(const xmlChar* target, const xmlChar* data); void cdataBlock(const xmlChar* s, int len); void comment(const xmlChar* s); void startDocument(const xmlChar* version, const xmlChar* encoding, int standalone); void internalSubset(const xmlChar* name, const xmlChar* externalID, const xmlChar* systemID); void endDocument(); #endif private: friend bool parseXMLDocumentFragment(const String& chunk, DocumentFragment* fragment, Element* parent); void initializeParserContext(const char* chunk = 0); void setCurrentNode(Node*); void insertErrorMessageBlock(); bool enterText(); void exitText(); void doWrite(const String&); void doEnd(); Document* m_doc; FrameView* m_view; String m_originalSourceForTransform; #if USE(QXMLSTREAM) QXmlStreamReader m_stream; bool m_wroteText; #else xmlParserCtxtPtr m_context; OwnPtr m_pendingCallbacks; Vector m_bufferedText; #endif Node* m_currentNode; bool m_currentNodeIsReferenced; bool m_sawError; bool m_sawXSLTransform; bool m_sawFirstElement; bool m_isXHTMLDocument; #if ENABLE(XHTMLMP) bool m_isXHTMLMPDocument; bool m_hasDocTypeDeclaration; #endif bool m_parserPaused; bool m_requestingScript; bool m_finishCalled; int m_errorCount; int m_lastErrorLine; int m_lastErrorColumn; String m_errorMessages; CachedResourceHandle m_pendingScript; RefPtr m_scriptElement; int m_scriptStartLine; bool m_parsingFragment; String m_defaultNamespaceURI; typedef HashMap PrefixForNamespaceMap; PrefixForNamespaceMap m_prefixToNamespaceMap; SegmentedString m_pendingSrc; }; #if ENABLE(XSLT) void* xmlDocPtrForString(DocLoader*, const String& source, const String& url); #endif HashMap parseAttributes(const String&, bool& attrsOK); bool parseXMLDocumentFragment(const String&, DocumentFragment*, Element* parent = 0); } // namespace WebCore #endif // USE(EXPAT) #endif // XMLTokenizer_h