Python XML SAX
xml.sax is a module for parsing XML.
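It implements SAX (the Simple API for XML), an event-driven interface: the parser reads the document sequentially and calls methods on a handler object as it encounters elements and text.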
Contents
Usage
from xml.sax import handler, make_parser


class MyHandler(handler.ContentHandler):
    """Print the text content of every ``<page>`` element.

    Text is collected only while the parser is inside a ``<page>`` element
    (including text of elements nested in it) and is printed when that
    element closes. Text outside of ``<page>`` elements is ignored.

    Attributes:
        in_page: True while the parser is between a ``<page>`` start tag
            and its matching end tag.
        character_buffer: Text collected so far for the current page.
    """

    def __init__(self):
        super().__init__()
        self.in_page = False
        self.character_buffer = ""

    def startElement(self, name, attrs):
        """Start collecting text when a ``<page>`` element opens."""
        if name == "page":
            self.in_page = True
            # Begin each page with an empty buffer.
            self.character_buffer = ""

    def endElement(self, name):
        """Print and clear the collected text when a ``<page>`` closes."""
        if name == "page":
            self.in_page = False
            print(self.character_buffer)
            self.character_buffer = ""

    def characters(self, data):
        """Append a chunk of character data to the current page's buffer.

        The parser may deliver contiguous text in several chunks, so the
        chunks are accumulated rather than handled one by one. Chunks that
        arrive outside of a ``<page>`` element are dropped.
        """
        if self.in_page:
            self.character_buffer += data


def parse(filename):
    """Parse an XML document and print the text of each ``<page>`` element.

    Args:
        filename: The document to parse; handed unchanged to the SAX
            parser's ``parse()`` method.
    """
    parser = make_parser()
    # Named so that it does not shadow the imported ``handler`` module.
    content_handler = MyHandler()
    parser.setContentHandler(content_handler)
    parser.parse(filename)
See also
Python xml.sax module documentation