Staging
v0.5.1
https://github.com/python/cpython
Raw File
Tip revision: c48b055258cfc31d8043af9c427e7a0e2980e60d authored by Benjamin Peterson on 06 March 2010, 20:37:32 UTC
Merged revisions 78739 via svnmerge from
Tip revision: c48b055
elem_count.py
"""
A simple demo that reads in an XML document and displays the number of
elements and attributes as well as a tally of elements and attributes by name.
"""

import sys
from collections import defaultdict

from xml.sax import make_parser, handler

class FancyCounter(handler.ContentHandler):
    """SAX content handler that tallies elements and attributes.

    While a document is parsed it keeps a running total of elements and
    attributes, plus a per-name count for each.  When the document ends,
    the totals and both per-name tallies are printed to standard output.
    """

    def __init__(self):
        # Let the base handler set up its own state before adding ours.
        super().__init__()
        self._elems = 0                       # total elements seen
        self._attrs = 0                       # total attributes seen
        self._elem_types = defaultdict(int)   # element name -> occurrences
        self._attr_types = defaultdict(int)   # attribute name -> occurrences

    def startElement(self, name, attrs):
        """Record one element called *name* and each attribute in *attrs*."""
        self._elems += 1
        self._attrs += len(attrs)
        self._elem_types[name] += 1

        # A distinct loop variable keeps the element's own name intact.
        for attr_name in attrs.keys():
            self._attr_types[attr_name] += 1

    def endDocument(self):
        """Print the overall totals followed by the per-name tallies."""
        print("There were", self._elems, "elements.")
        print("There were", self._attrs, "attributes.")

        print("---ELEMENT TYPES")
        for elem_name, count in self._elem_types.items():
            print("%20s %d" % (elem_name, count))

        print("---ATTRIBUTE TYPES")
        for attr_name, count in self._attr_types.items():
            print("%20s %d" % (attr_name, count))

if __name__ == '__main__':
    # The document to analyse is taken from the first command-line argument;
    # exit with a usage hint instead of an IndexError when it is missing.
    if len(sys.argv) < 2:
        sys.exit("usage: %s <xml-file>" % sys.argv[0])

    parser = make_parser()
    # The handler prints its report itself once the document ends.
    parser.setContentHandler(FancyCounter())
    parser.parse(sys.argv[1])
back to top