Edit

kc3-lang/libxml2/testSAX.c

Branch :

  • Show log

    Commit

  • Author : Daniel Veillard
    Date : 2002-03-20 19:24:21
    Hash : e50f3b5d
    Message : I wanted to see the real speed at the SAX interface after a little too * testSAX.c: I wanted to see the real speed at the SAX interface after a little too many Ximianer started complaining about the parser speed. added a --quiet option: paphio:~/XML -> ls -l db100000.xml -rw-rw-r-- 1 veillard www 20182040 Mar 20 10:30 db100000.xml paphio:~/XML -> time ./testSAX --quiet db100000.xml 3200006 callbacks generated real 0m1.270s Which means 16MBytes/s and 3Mcallback/s Daniel

  • testSAX.c
  • /*
     * testSAX.c : a small tester program for parsing using the SAX API.
     *
     * See Copyright for the status of this software.
     *
     * daniel@veillard.com
     */
    
    #include "libxml.h"
    
    #include <string.h>
    #include <stdarg.h>
    
    #ifdef HAVE_SYS_TYPES_H
    #include <sys/types.h>
    #endif
    #ifdef HAVE_SYS_STAT_H
    #include <sys/stat.h>
    #endif
    #ifdef HAVE_FCNTL_H
    #include <fcntl.h>
    #endif
    #ifdef HAVE_UNISTD_H
    #include <unistd.h>
    #endif
    #ifdef HAVE_STDLIB_H
    #include <stdlib.h>
    #endif
    #ifdef HAVE_STRING_H
    #include <string.h>
    #endif
    
    
    #include <libxml/globals.h>
    #include <libxml/xmlerror.h>
    #include <libxml/parser.h>
    #include <libxml/parserInternals.h> /* only for xmlNewInputFromFile() */
    #include <libxml/tree.h>
    #include <libxml/debugXML.h>
    #include <libxml/xmlmemory.h>
    
    static int debug = 0;
    static int copy = 0;
    static int recovery = 0;
    static int push = 0;
    static int speed = 0;
    static int noent = 0;
    static int quiet = 0;
    static int callbacks = 0;
    
    xmlSAXHandler emptySAXHandlerStruct = {
        NULL, /* internalSubset */
        NULL, /* isStandalone */
        NULL, /* hasInternalSubset */
        NULL, /* hasExternalSubset */
        NULL, /* resolveEntity */
        NULL, /* getEntity */
        NULL, /* entityDecl */
        NULL, /* notationDecl */
        NULL, /* attributeDecl */
        NULL, /* elementDecl */
        NULL, /* unparsedEntityDecl */
        NULL, /* setDocumentLocator */
        NULL, /* startDocument */
        NULL, /* endDocument */
        NULL, /* startElement */
        NULL, /* endElement */
        NULL, /* reference */
        NULL, /* characters */
        NULL, /* ignorableWhitespace */
        NULL, /* processingInstruction */
        NULL, /* comment */
        NULL, /* xmlParserWarning */
        NULL, /* xmlParserError */
        NULL, /* xmlParserError */
        NULL, /* getParameterEntity */
        NULL, /* cdataBlock; */
        NULL,  /* externalSubset; */
        1
    };
    
    xmlSAXHandlerPtr emptySAXHandler = &emptySAXHandlerStruct;
    extern xmlSAXHandlerPtr debugSAXHandler;
    
    /************************************************************************
     *									*
     *				Debug Handlers				*
     *									*
     ************************************************************************/
    
    /**
     * isStandaloneDebug:
     * @ctxt:  An XML parser context
     *
     * Is this document tagged standalone ?
     *
     * Returns 1 if true
     */
    static int
    isStandaloneDebug(void *ctx ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return(0);
        fprintf(stdout, "SAX.isStandalone()\n");
        return(0);
    }
    
    /**
     * hasInternalSubsetDebug:
     * @ctxt:  An XML parser context
     *
     * Does this document has an internal subset
     *
     * Returns 1 if true
     */
    static int
    hasInternalSubsetDebug(void *ctx ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return(0);
        fprintf(stdout, "SAX.hasInternalSubset()\n");
        return(0);
    }
    
    /**
     * hasExternalSubsetDebug:
     * @ctxt:  An XML parser context
     *
     * Does this document has an external subset
     *
     * Returns 1 if true
     */
    static int
    hasExternalSubsetDebug(void *ctx ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return(0);
        fprintf(stdout, "SAX.hasExternalSubset()\n");
        return(0);
    }
    
    /**
     * internalSubsetDebug:
     * @ctxt:  An XML parser context
     *
     * Does this document has an internal subset
     */
    static void
    internalSubsetDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name,
    	       const xmlChar *ExternalID, const xmlChar *SystemID)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.internalSubset(%s,", name);
        if (ExternalID == NULL)
    	fprintf(stdout, " ,");
        else
    	fprintf(stdout, " %s,", ExternalID);
        if (SystemID == NULL)
    	fprintf(stdout, " )\n");
        else
    	fprintf(stdout, " %s)\n", SystemID);
    }
    
    /**
     * externalSubsetDebug:
     * @ctxt:  An XML parser context
     *
     * Does this document has an external subset
     */
    static void
    externalSubsetDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name,
    	       const xmlChar *ExternalID, const xmlChar *SystemID)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.externalSubset(%s,", name);
        if (ExternalID == NULL)
    	fprintf(stdout, " ,");
        else
    	fprintf(stdout, " %s,", ExternalID);
        if (SystemID == NULL)
    	fprintf(stdout, " )\n");
        else
    	fprintf(stdout, " %s)\n", SystemID);
    }
    
    /**
     * resolveEntityDebug:
     * @ctxt:  An XML parser context
     * @publicId: The public ID of the entity
     * @systemId: The system ID of the entity
     *
     * Special entity resolver, better left to the parser, it has
     * more context than the application layer.
     * The default behaviour is to NOT resolve the entities, in that case
     * the ENTITY_REF nodes are built in the structure (and the parameter
     * values).
     *
     * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
     */
    static xmlParserInputPtr
    resolveEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *publicId, const xmlChar *systemId)
    {
        callbacks++;
        if (quiet)
    	return(NULL);
        /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
    
        
        fprintf(stdout, "SAX.resolveEntity(");
        if (publicId != NULL)
    	fprintf(stdout, "%s", (char *)publicId);
        else
    	fprintf(stdout, " ");
        if (systemId != NULL)
    	fprintf(stdout, ", %s)\n", (char *)systemId);
        else
    	fprintf(stdout, ", )\n");
    /*********
        if (systemId != NULL) {
            return(xmlNewInputFromFile(ctxt, (char *) systemId));
        }
     *********/
        return(NULL);
    }
    
    /**
     * getEntityDebug:
     * @ctxt:  An XML parser context
     * @name: The entity name
     *
     * Get an entity by name
     *
     * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
     */
    static xmlEntityPtr
    getEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name)
    {
        callbacks++;
        if (quiet)
    	return(NULL);
        fprintf(stdout, "SAX.getEntity(%s)\n", name);
        return(NULL);
    }
    
    /**
     * getParameterEntityDebug:
     * @ctxt:  An XML parser context
     * @name: The entity name
     *
     * Get a parameter entity by name
     *
     * Returns the xmlParserInputPtr
     */
    static xmlEntityPtr
    getParameterEntityDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name)
    {
        callbacks++;
        if (quiet)
    	return(NULL);
        fprintf(stdout, "SAX.getParameterEntity(%s)\n", name);
        return(NULL);
    }
    
    
    /**
     * entityDeclDebug:
     * @ctxt:  An XML parser context
     * @name:  the entity name 
     * @type:  the entity type 
     * @publicId: The public ID of the entity
     * @systemId: The system ID of the entity
     * @content: the entity value (without processing).
     *
     * An entity definition has been parsed
     */
    static void
    entityDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, int type,
              const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.entityDecl(%s, %d, %s, %s, %s)\n",
                name, type, publicId, systemId, content);
    }
    
    /**
     * attributeDeclDebug:
     * @ctxt:  An XML parser context
     * @name:  the attribute name 
     * @type:  the attribute type 
     *
     * An attribute definition has been parsed
     */
    static void
    attributeDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *elem, const xmlChar *name,
                  int type, int def, const xmlChar *defaultValue,
    	      xmlEnumerationPtr tree ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return;
        if (defaultValue == NULL)
    	fprintf(stdout, "SAX.attributeDecl(%s, %s, %d, %d, NULL, ...)\n",
                elem, name, type, def);
        else
    	fprintf(stdout, "SAX.attributeDecl(%s, %s, %d, %d, %s, ...)\n",
                elem, name, type, def, defaultValue);
    }
    
    /**
     * elementDeclDebug:
     * @ctxt:  An XML parser context
     * @name:  the element name 
     * @type:  the element type 
     * @content: the element value (without processing).
     *
     * An element definition has been parsed
     */
    static void
    elementDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, int type,
    	    xmlElementContentPtr content ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.elementDecl(%s, %d, ...)\n",
                name, type);
    }
    
    /**
     * notationDeclDebug:
     * @ctxt:  An XML parser context
     * @name: The name of the notation
     * @publicId: The public ID of the entity
     * @systemId: The system ID of the entity
     *
     * What to do when a notation declaration has been parsed.
     */
    static void
    notationDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name,
    	     const xmlChar *publicId, const xmlChar *systemId)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.notationDecl(%s, %s, %s)\n",
                (char *) name, (char *) publicId, (char *) systemId);
    }
    
    /**
     * unparsedEntityDeclDebug:
     * @ctxt:  An XML parser context
     * @name: The name of the entity
     * @publicId: The public ID of the entity
     * @systemId: The system ID of the entity
     * @notationName: the name of the notation
     *
     * What to do when an unparsed entity declaration is parsed
     */
    static void
    unparsedEntityDeclDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name,
    		   const xmlChar *publicId, const xmlChar *systemId,
    		   const xmlChar *notationName)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.unparsedEntityDecl(%s, %s, %s, %s)\n",
                (char *) name, (char *) publicId, (char *) systemId,
    	    (char *) notationName);
    }
    
    /**
     * setDocumentLocatorDebug:
     * @ctxt:  An XML parser context
     * @loc: A SAX Locator
     *
     * Receive the document locator at startup, actually xmlDefaultSAXLocator
     * Everything is available on the context, so this is useless in our case.
     */
    static void
    setDocumentLocatorDebug(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.setDocumentLocator()\n");
    }
    
    /**
     * startDocumentDebug:
     * @ctxt:  An XML parser context
     *
     * called when the document start being processed.
     */
    static void
    startDocumentDebug(void *ctx ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.startDocument()\n");
    }
    
    /**
     * endDocumentDebug:
     * @ctxt:  An XML parser context
     *
     * called when the document end has been detected.
     */
    static void
    endDocumentDebug(void *ctx ATTRIBUTE_UNUSED)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.endDocument()\n");
    }
    
    /**
     * startElementDebug:
     * @ctxt:  An XML parser context
     * @name:  The element name
     *
     * called when an opening tag has been processed.
     */
    static void
    startElementDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name, const xmlChar **atts)
    {
        int i;
    
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.startElement(%s", (char *) name);
        if (atts != NULL) {
            for (i = 0;(atts[i] != NULL);i++) {
    	    fprintf(stdout, ", %s='", atts[i++]);
    	    if (atts[i] != NULL)
    	        fprintf(stdout, "%s'", atts[i]);
    	}
        }
        fprintf(stdout, ")\n");
    }
    
    /**
     * endElementDebug:
     * @ctxt:  An XML parser context
     * @name:  The element name
     *
     * called when the end of an element has been detected.
     */
    static void
    endElementDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.endElement(%s)\n", (char *) name);
    }
    
    /**
     * charactersDebug:
     * @ctxt:  An XML parser context
     * @ch:  a xmlChar string
     * @len: the number of xmlChar
     *
     * receiving some chars from the parser.
     * Question: how much at a time ???
     */
    static void
    charactersDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch, int len)
    {
        char output[40];
        int i;
    
        callbacks++;
        if (quiet)
    	return;
        for (i = 0;(i<len) && (i < 30);i++)
    	output[i] = ch[i];
        output[i] = 0;
    
        fprintf(stdout, "SAX.characters(%s, %d)\n", output, len);
    }
    
    /**
     * referenceDebug:
     * @ctxt:  An XML parser context
     * @name:  The entity name
     *
     * called when an entity reference is detected. 
     */
    static void
    referenceDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *name)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.reference(%s)\n", name);
    }
    
    /**
     * ignorableWhitespaceDebug:
     * @ctxt:  An XML parser context
     * @ch:  a xmlChar string
     * @start: the first char in the string
     * @len: the number of xmlChar
     *
     * receiving some ignorable whitespaces from the parser.
     * Question: how much at a time ???
     */
    static void
    ignorableWhitespaceDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch, int len)
    {
        char output[40];
        int i;
    
        callbacks++;
        if (quiet)
    	return;
        for (i = 0;(i<len) && (i < 30);i++)
    	output[i] = ch[i];
        output[i] = 0;
        fprintf(stdout, "SAX.ignorableWhitespace(%s, %d)\n", output, len);
    }
    
    /**
     * processingInstructionDebug:
     * @ctxt:  An XML parser context
     * @target:  the target name
     * @data: the PI data's
     * @len: the number of xmlChar
     *
     * A processing instruction has been parsed.
     */
    static void
    processingInstructionDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *target,
                          const xmlChar *data)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.processingInstruction(%s, %s)\n",
                (char *) target, (char *) data);
    }
    
    /**
     * cdataBlockDebug:
     * @ctx: the user data (XML parser context)
     * @value:  The pcdata content
     * @len:  the block length
     *
     * called when a pcdata block has been parsed
     */
    static void
    cdataBlockDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *value, int len)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.pcdata(%.20s, %d)\n",
    	    (char *) value, len);
    }
    
    /**
     * commentDebug:
     * @ctxt:  An XML parser context
     * @value:  the comment content
     *
     * A comment has been parsed.
     */
    static void
    commentDebug(void *ctx ATTRIBUTE_UNUSED, const xmlChar *value)
    {
        callbacks++;
        if (quiet)
    	return;
        fprintf(stdout, "SAX.comment(%s)\n", value);
    }
    
    /**
     * warningDebug:
     * @ctxt:  An XML parser context
     * @msg:  the message to display/transmit
     * @...:  extra parameters for the message display
     *
     * Display and format a warning messages, gives file, line, position and
     * extra parameters.
     */
    static void
    warningDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...)
    {
        va_list args;
    
        callbacks++;
        if (quiet)
    	return;
        va_start(args, msg);
        fprintf(stdout, "SAX.warning: ");
        vfprintf(stdout, msg, args);
        va_end(args);
    }
    
    /**
     * errorDebug:
     * @ctxt:  An XML parser context
     * @msg:  the message to display/transmit
     * @...:  extra parameters for the message display
     *
     * Display and format a error messages, gives file, line, position and
     * extra parameters.
     */
    static void
    errorDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...)
    {
        va_list args;
    
        callbacks++;
        if (quiet)
    	return;
        va_start(args, msg);
        fprintf(stdout, "SAX.error: ");
        vfprintf(stdout, msg, args);
        va_end(args);
    }
    
    /**
     * fatalErrorDebug:
     * @ctxt:  An XML parser context
     * @msg:  the message to display/transmit
     * @...:  extra parameters for the message display
     *
     * Display and format a fatalError messages, gives file, line, position and
     * extra parameters.
     */
    static void
    fatalErrorDebug(void *ctx ATTRIBUTE_UNUSED, const char *msg, ...)
    {
        va_list args;
    
        callbacks++;
        if (quiet)
    	return;
        va_start(args, msg);
        fprintf(stdout, "SAX.fatalError: ");
        vfprintf(stdout, msg, args);
        va_end(args);
    }
    
    xmlSAXHandler debugSAXHandlerStruct = {
        internalSubsetDebug,
        isStandaloneDebug,
        hasInternalSubsetDebug,
        hasExternalSubsetDebug,
        resolveEntityDebug,
        getEntityDebug,
        entityDeclDebug,
        notationDeclDebug,
        attributeDeclDebug,
        elementDeclDebug,
        unparsedEntityDeclDebug,
        setDocumentLocatorDebug,
        startDocumentDebug,
        endDocumentDebug,
        startElementDebug,
        endElementDebug,
        referenceDebug,
        charactersDebug,
        ignorableWhitespaceDebug,
        processingInstructionDebug,
        commentDebug,
        warningDebug,
        errorDebug,
        fatalErrorDebug,
        getParameterEntityDebug,
        cdataBlockDebug,
        externalSubsetDebug,
        1
    };
    
    xmlSAXHandlerPtr debugSAXHandler = &debugSAXHandlerStruct;
    
    /************************************************************************
     *									*
     *				Debug					*
     *									*
     ************************************************************************/
    
    static void
    parseAndPrintFile(char *filename) {
        int res;
    
        if (push) {
    	FILE *f;
    
    	/*
    	 * Empty callbacks for checking
    	 */
    	f = fopen(filename, "r");
    	if (f != NULL) {
    	    int ret;
    	    char chars[10];
    	    xmlParserCtxtPtr ctxt;
    
    	    ret = fread(chars, 1, 4, f);
    	    if (ret > 0) {
    		ctxt = xmlCreatePushParserCtxt(emptySAXHandler, NULL,
    			    chars, ret, filename);
    		while ((ret = fread(chars, 1, 3, f)) > 0) {
    		    xmlParseChunk(ctxt, chars, ret, 0);
    		}
    		xmlParseChunk(ctxt, chars, 0, 1);
    		xmlFreeParserCtxt(ctxt);
    	    }
    	    fclose(f);
    	} else {
    	    xmlGenericError(xmlGenericErrorContext,
    		    "Cannot read file %s\n", filename);
    	}
    	/*
    	 * Debug callback
    	 */
    	f = fopen(filename, "r");
    	if (f != NULL) {
    	    int ret;
    	    char chars[10];
    	    xmlParserCtxtPtr ctxt;
    
    	    ret = fread(chars, 1, 4, f);
    	    if (ret > 0) {
    		ctxt = xmlCreatePushParserCtxt(debugSAXHandler, NULL,
    			    chars, ret, filename);
    		while ((ret = fread(chars, 1, 3, f)) > 0) {
    		    xmlParseChunk(ctxt, chars, ret, 0);
    		}
    		ret = xmlParseChunk(ctxt, chars, 0, 1);
    		xmlFreeParserCtxt(ctxt);
    		if (ret != 0) {
    		    fprintf(stdout,
    		            "xmlSAXUserParseFile returned error %d\n", ret);
    		}
    	    }
    	    fclose(f);
    	}
        } else {
    	if (!speed) {
    	    /*
    	     * Empty callbacks for checking
    	     */
    	    if (!quiet) {
    		res = xmlSAXUserParseFile(emptySAXHandler, NULL, filename);
    		if (res != 0) {
    		    fprintf(stdout, "xmlSAXUserParseFile returned error %d\n", res);
    		}
    	    }
    
    	    /*
    	     * Debug callback
    	     */
    	    callbacks = 0;
    	    res = xmlSAXUserParseFile(debugSAXHandler, NULL, filename);
    	    if (res != 0) {
    		fprintf(stdout, "xmlSAXUserParseFile returned error %d\n", res);
    	    }
    	    if (quiet)
    		fprintf(stdout, "%d callbacks generated\n", callbacks);
    	} else {
    	    /*
    	     * test 100x the SAX parse
    	     */
    	    int i;
    
    	    for (i = 0; i<100;i++)
    		res = xmlSAXUserParseFile(emptySAXHandler, NULL, filename);
    	    if (res != 0) {
    		fprintf(stdout, "xmlSAXUserParseFile returned error %d\n", res);
    	    }
    	}
        }
    }
    
    
    int main(int argc, char **argv) {
        int i;
        int files = 0;
    
        for (i = 1; i < argc ; i++) {
    	if ((!strcmp(argv[i], "-debug")) || (!strcmp(argv[i], "--debug")))
    	    debug++;
    	else if ((!strcmp(argv[i], "-copy")) || (!strcmp(argv[i], "--copy")))
    	    copy++;
    	else if ((!strcmp(argv[i], "-recover")) ||
    	         (!strcmp(argv[i], "--recover")))
    	    recovery++;
    	else if ((!strcmp(argv[i], "-push")) ||
    	         (!strcmp(argv[i], "--push")))
    	    push++;
    	else if ((!strcmp(argv[i], "-speed")) ||
    	         (!strcmp(argv[i], "--speed")))
    	    speed++;
    	else if ((!strcmp(argv[i], "-noent")) ||
    	         (!strcmp(argv[i], "--noent")))
    	    noent++;
    	else if ((!strcmp(argv[i], "-quiet")) ||
    	         (!strcmp(argv[i], "--quiet")))
    	    quiet++;
        }
        if (noent != 0) xmlSubstituteEntitiesDefault(1);
        for (i = 1; i < argc ; i++) {
    	if (argv[i][0] != '-') {
    	    parseAndPrintFile(argv[i]);
    	    files ++;
    	}
        }
        xmlCleanupParser();
        xmlMemoryDump();
    
        return(0);
    }