/* This file is part of the KDE libraries Copyright (C) 1997 Martin Jones (mjones@kde.org) (C) 1997 Torben Weis (weis@kde.org) (C) 1998 Waldo Bastian (bastian@kde.org) (C) 1999 Lars Knoll (knoll@kde.org) Copyright (C) 2003 Apple Computer, Inc. This library is free software; you can redistribute it and/or modify it under the terms of the GNU Library General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This library is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU Library General Public License for more details. You should have received a copy of the GNU Library General Public License along with this library; see the file COPYING.LIB. If not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. */ //---------------------------------------------------------------------------- // // KDE HTML Widget -- HTML Parser #ifndef HTMLPARSER_H #define HTMLPARSER_H // 0 all // 1 domtree + rendertree + styleForElement, no layouting // 2 domtree only #define SPEED_DEBUG 0 #ifdef SPEED_DEBUG #include #endif #include "dom/dom_string.h" #include "xml/dom_nodeimpl.h" #include "html/html_documentimpl.h" class KHTMLView; class HTMLStackElem; namespace DOM { class HTMLDocumentImpl; class DocumentPtr; class HTMLElementImpl; class NodeImpl; class HTMLFormElementImpl; class HTMLMapElementImpl; class HTMLHeadElementImpl; class DocumentFragmentImpl; } namespace khtml { class Token; }; class KHTMLParser; /** * The parser for html. It receives a stream of tokens from the HTMLTokenizer, and * builds up the Document structure form it. */ class KHTMLParser { public: KHTMLParser( KHTMLView *w, DOM::DocumentPtr *i ); KHTMLParser( DOM::DocumentFragmentImpl *frag, DOM::DocumentPtr *doc ); virtual ~KHTMLParser(); /** * parses one token delivered by the tokenizer */ void parseToken(khtml::Token *_t); /** * tokenizer says it's not going to be sending us any more tokens */ void finished(); /** * resets the parser */ void reset(); bool skipMode() const { return (discard_until != 0); } bool noSpaces() const { return !inBody; } bool selectMode() const { return inSelect; } DOM::HTMLDocumentImpl *doc() const { return static_cast(document->document()); } DOM::DocumentPtr *docPtr() const { return document; } protected: void setCurrent(DOM::NodeImpl *newCurrent); KHTMLView *HTMLWidget; DOM::DocumentPtr *document; /* * generate an element from the token */ DOM::NodeImpl *getElement(khtml::Token *); void processCloseTag(khtml::Token *); bool insertNode(DOM::NodeImpl *n, bool flat = false); /* * The currently active element (the one new elements will be added to) */ DOM::NodeImpl *current; HTMLStackElem *blockStack; void pushBlock( int _id, int _level); void popBlock( int _id ); void popOneBlock(bool delBlock = true); void popInlineBlocks(); void freeBlock( void); void createHead(); bool isResidualStyleTag(int _id); bool isAffectedByResidualStyle(int _id); void handleResidualStyleCloseTagAcrossBlocks(HTMLStackElem* elem); void reopenResidualStyleTags(HTMLStackElem* elem, DOM::NodeImpl* malformedTableParent); bool allowNestedRedundantTag(int _id); ushort *forbiddenTag; /* * currently active form */ DOM::HTMLFormElementImpl *form; /* * current map */ DOM::HTMLMapElementImpl *map; /* * the head element. Needed for crappy html which defines after */ DOM::HTMLHeadElementImpl *head; /* * a possible element in the head. Compatibility hack for * html from the stone age */ DOM::NodeImpl *isindex; DOM::NodeImpl *handleIsindex( khtml::Token *t ); /* * inserts the stupid isIndex element. */ void startBody(); bool inBody; bool haveContent; bool haveFrameSet; bool end; bool inSelect; /* * tells the parser to discard all tags, until it reaches the one specified */ int discard_until; bool headLoaded; int inStrayTableContent; #if SPEED_DEBUG > 0 QTime qt; #endif }; #endif // HTMLPARSER_H