⇤ ← Revision 1 as of 2022-05-02 15:51:42
Size: 833
Comment:
|
Size: 833
Comment:
|
Deletions are marked like this. | Additions are marked like this. |
Line 1: | Line 1: |
= Python Xml Sax = | = Python XML SAX = |
Python XML SAX
Contents
Usage
from xml.sax import handler, make_parser


class MyHandler(handler.ContentHandler):
    """SAX content handler that prints the text of every ``<page>`` element.

    Character data is collected only while the parser is inside a ``page``
    element; when that element closes, the collected text is printed and the
    buffer is cleared for the next page.
    """

    def __init__(self):
        handler.ContentHandler.__init__(self)
        # True between the start and end tag of a "page" element.
        self.in_page = False
        # Text gathered for the page currently being read.
        self.character_buffer = ""

    def startElement(self, name, attrs):
        """Mark the beginning of a ``page`` element; other tags are ignored."""
        if name == "page":
            self.in_page = True

    def endElement(self, name):
        """Print and reset the buffered text when a ``page`` element closes."""
        if name == "page":
            self.in_page = False
            print(self.character_buffer)
            self.character_buffer = ""

    def characters(self, data):
        """Append ``data`` to the buffer, but only while inside a ``page``.

        The parser may deliver one run of text in several calls, so the
        chunks are concatenated rather than replaced.
        """
        # Without this guard, text that lies outside any <page> element
        # would leak into the output of the following page.
        if self.in_page:
            self.character_buffer += data


def parse(filename):
    """Parse ``filename`` with a default SAX parser and a ``MyHandler``.

    Args:
        filename: Passed straight to the parser's ``parse`` method.
    """
    parser = make_parser()
    # Named so that it does not shadow the imported ``handler`` module.
    content_handler = MyHandler()
    parser.setContentHandler(content_handler)
    parser.parse(filename)