Edit

kc3-lang/libxml2/HTMLparser.h

Branch :

  • Show log

    Commit

  • Author : Daniel Veillard
    Date : 2001-03-24 17:00:36
    Hash : 56a4cb8c
    Message : Huge cleanup, I switched to compile with -Wall -g -O -ansi -pedantic -W -Wunused -Wimplicit -Wreturn-type -Wswitch -Wcomment -Wtrigraphs -Wformat -Wchar-subscripts -Wuninitialized -Wparentheses -Wshadow -Wpointer-arith -Wcast-align -Wwrite-strings -Waggregate-return -Wstrict-prototypes -Wmissing-prototypes -Wnested-externs -Winline - HTMLparser.[ch] HTMLtree.c SAX.c debugXML.c encoding.[ch] encoding.h entities.c error.c list.[ch] nanoftp.c nanohttp.c parser.[ch] parserInternals.[ch] testHTML.c testSAX.c testURI.c testXPath.c tree.[ch] uri.c valid.[ch] xinclude.c xmlIO.[ch] xmllint.c xmlmemory.c xpath.c xpathInternals.h xpointer.[ch] example/gjobread.c: Cleanup, staticfied a number of non-exported functions, detected and cleaned up a dozen of problem found this way, avoided a lot of public function name/typedef/system names clashes - doc/xml.html: updated - configure.in: switched private flags to the really pedantic ones. Daniel

  • HTMLparser.h
  • /*
     * HTMLparser.h : inf=terface for an HTML 4.0 non-verifying parser
     *
     * See Copyright for the status of this software.
     *
     * Daniel.Veillard@w3.org
     */
    
    #ifndef __HTML_PARSER_H__
    #define __HTML_PARSER_H__
    #include <libxml/parser.h>
    
    #ifdef __cplusplus
    extern "C" {
    #endif
    
    /*
     * Most of the back-end structures from XML and HTML are shared
     */
    typedef xmlParserCtxt htmlParserCtxt;
    typedef xmlParserCtxtPtr htmlParserCtxtPtr;
    typedef xmlParserNodeInfo htmlParserNodeInfo;
    typedef xmlSAXHandler htmlSAXHandler;
    typedef xmlSAXHandlerPtr htmlSAXHandlerPtr;
    typedef xmlParserInput htmlParserInput;
    typedef xmlParserInputPtr htmlParserInputPtr;
    typedef xmlDocPtr htmlDocPtr;
    typedef xmlNodePtr htmlNodePtr;
    
    /*
     * Internal description of an HTML element
     */
    typedef struct _htmlElemDesc htmlElemDesc;
    typedef htmlElemDesc *htmlElemDescPtr;
    struct _htmlElemDesc {
        const char *name;	/* The tag name */
        char startTag;       /* Whether the start tag can be implied */
        char endTag;         /* Whether the end tag can be implied */
        char saveEndTag;     /* Whether the end tag should be saved */
        char empty;          /* Is this an empty element ? */
        char depr;           /* Is this a deprecated element ? */
        char dtd;            /* 1: only in Loose DTD, 2: only Frameset one */
        const char *desc;   /* the description */
    };
    
    /*
     * Internal description of an HTML entity
     */
    typedef struct _htmlEntityDesc htmlEntityDesc;
    typedef htmlEntityDesc *htmlEntityDescPtr;
    struct _htmlEntityDesc {
        unsigned int value;	/* the UNICODE value for the character */
        const char *name;	/* The entity name */
        const char *desc;   /* the description */
    };
    
    /*
     * There is only few public functions.
     */
    htmlElemDescPtr		htmlTagLookup	(const xmlChar *tag);
    htmlEntityDescPtr	htmlEntityLookup(const xmlChar *name);
    htmlEntityDescPtr	htmlEntityValueLookup(unsigned int value);
    
    int			htmlIsAutoClosed(htmlDocPtr doc,
    					 htmlNodePtr elem);
    int			htmlAutoCloseTag(htmlDocPtr doc,
    					 const xmlChar *name,
    					 htmlNodePtr elem);
    htmlEntityDescPtr	htmlParseEntityRef(htmlParserCtxtPtr ctxt,
    					 xmlChar **str);
    int			htmlParseCharRef(htmlParserCtxtPtr ctxt);
    void			htmlParseElement(htmlParserCtxtPtr ctxt);
    
    htmlDocPtr		htmlSAXParseDoc	(xmlChar *cur,
    					 const char *encoding,
    					 htmlSAXHandlerPtr sax,
    					 void *userData);
    htmlDocPtr		htmlParseDoc	(xmlChar *cur,
    					 const char *encoding);
    htmlDocPtr		htmlSAXParseFile(const char *filename,
    					 const char *encoding,
    					 htmlSAXHandlerPtr sax,
    					 void *userData);
    htmlDocPtr		htmlParseFile	(const char *filename,
    					 const char *encoding);
    int			UTF8ToHtml	(unsigned char* out,
    					 int *outlen,
    					 const unsigned char* in,
    					 int *inlen);
    int			htmlEncodeEntities(unsigned char* out,
    					 int *outlen,
    					 const unsigned char* in,
    					 int *inlen, int quoteChar);
    int			htmlIsScriptAttribute(const xmlChar *name);
    int			htmlHandleOmittedElem(int val);
    
    /**
     * Interfaces for the Push mode
     */
    void			htmlFreeParserCtxt	(htmlParserCtxtPtr ctxt);
    htmlParserCtxtPtr	htmlCreatePushParserCtxt(htmlSAXHandlerPtr sax,
    						 void *user_data,
    						 const char *chunk,
    						 int size,
    						 const char *filename,
    						 xmlCharEncoding enc);
    int			htmlParseChunk		(htmlParserCtxtPtr ctxt,
    						 const char *chunk,
    						 int size,
    						 int terminate);
    #ifdef __cplusplus
    }
    #endif
    
    #endif /* __HTML_PARSER_H__ */