# Staging
# v0.8.1
# Revision 5a607a3ee5e81bdcef3f886f9d20c1376a533df4 authored by Mark Hammond on 06 May 2009, 08:04:54 UTC, committed by Mark Hammond on 06 May 2009, 08:04:54 UTC
# By Larry Hastings, reviewed eric.smith and mark.hammond.
# 1 parent 9348901
# Raw File
# elem_count.py
import sys

from xml.sax import make_parser, handler

class FancyCounter(handler.ContentHandler):
    """SAX content handler that tallies elements and attributes.

    Totals and per-name counts are accumulated in ``startElement`` and
    written to standard output by ``endDocument``.
    """

    def __init__(self):
        # Run the base initialiser so the state it sets up on the handler
        # also exists on this subclass.
        super().__init__()
        self._elems = 0        # total number of startElement calls
        self._attrs = 0        # total number of attributes seen
        self._elem_types = {}  # element name -> occurrence count
        self._attr_types = {}  # attribute name -> occurrence count

    def startElement(self, name, attrs):
        """Count one element called *name* together with its attributes.

        *attrs* must support ``len()`` and ``keys()``.
        """
        self._elems += 1
        self._attrs += len(attrs)
        self._elem_types[name] = self._elem_types.get(name, 0) + 1

        # Use a dedicated loop variable so the ``name`` parameter is not
        # rebound while walking the attribute names.
        for attr_name in attrs.keys():
            self._attr_types[attr_name] = self._attr_types.get(attr_name, 0) + 1

    def endDocument(self):
        """Print the totals, then the per-name element and attribute counts."""
        print("There were", self._elems, "elements.")
        print("There were", self._attrs, "attributes.")

        print("---ELEMENT TYPES")
        for pair in self._elem_types.items():
            print("%20s %d" % pair)

        print("---ATTRIBUTE TYPES")
        for pair in self._attr_types.items():
            print("%20s %d" % pair)


# Script entry point: parse the XML file named on the command line and let
# FancyCounter print its statistics when the document ends.
if __name__ == "__main__":
    # A missing argument should produce a usage message, not an IndexError
    # traceback. Extra arguments are still ignored, as before.
    if len(sys.argv) < 2:
        sys.exit("usage: %s <xml-file>" % sys.argv[0])

    parser = make_parser()
    parser.setContentHandler(FancyCounter())
    parser.parse(sys.argv[1])
# back to top