Python XML SAX
Contents
Usage
from xml.sax import handler, make_parser
class MyHandler(handler.ContentHandler):
    """SAX content handler that prints the text content of each <page> element.

    Character data is collected only while the parser is inside a <page>
    element; when the element closes, the collected text is printed and the
    buffer is cleared for the next page.
    """

    def __init__(self):
        handler.ContentHandler.__init__(self)
        # True between the start and end events of a <page> element.
        self.in_page = False
        # Text gathered for the <page> element currently being read.
        self.character_buffer = ""

    def startElement(self, name, attrs):
        """Mark the beginning of a <page> element; other elements are ignored."""
        if name == "page":
            self.in_page = True

    def endElement(self, name):
        """Print and reset the buffered text when a <page> element closes."""
        if name == "page":
            self.in_page = False
            print(self.character_buffer)
            self.character_buffer = ""

    def characters(self, data):
        """Append a chunk of character data, but only while inside <page>.

        The parser may deliver one run of text as several chunks, so chunks
        are concatenated rather than replaced. Text outside <page> is dropped
        so it cannot leak into the output of the next page.
        """
        if self.in_page:
            self.character_buffer += data
def parse(filename):
    """Run a SAX parse of *filename* with a fresh ``MyHandler`` attached.

    Creates a parser via ``make_parser()``, installs a new ``MyHandler`` as
    its content handler, and passes *filename* to the parser's ``parse()``.
    Returns nothing.
    """
    content_handler = MyHandler()
    sax_parser = make_parser()
    sax_parser.setContentHandler(content_handler)
    sax_parser.parse(filename)