2000-06-29 16:33:43 -03:00
|
|
|
"""Simple API for XML (SAX) implementation for Python.
|
|
|
|
|
|
|
|
This module provides an implementation of the SAX 2 interface;
|
|
|
|
information about the Java version of the interface can be found at
|
|
|
|
http://www.megginson.com/SAX/. The Python version of the interface is
|
|
|
|
documented at <...>.
|
|
|
|
|
|
|
|
This package contains the following modules:
|
|
|
|
|
2000-09-18 13:31:08 -03:00
|
|
|
handler -- Base classes and constants which define the SAX 2 API for
|
|
|
|
the 'client-side' of SAX for Python.
|
2000-06-29 16:33:43 -03:00
|
|
|
|
2000-09-18 13:31:08 -03:00
|
|
|
saxutils -- Implementation of the convenience classes commonly used to
|
|
|
|
work with SAX.
|
2000-06-29 16:33:43 -03:00
|
|
|
|
2000-09-18 13:31:08 -03:00
|
|
|
xmlreader -- Base classes and constants which define the SAX 2 API for
|
|
|
|
the parsers used with SAX for Python.
|
|
|
|
|
2000-09-24 17:38:18 -03:00
|
|
|
expatreader -- Driver that allows use of the Expat parser with SAX.
|
2000-06-29 16:33:43 -03:00
|
|
|
"""
|
|
|
|
|
2000-09-24 15:54:49 -03:00
|
|
|
from xmlreader import InputSource
|
2000-07-01 10:44:04 -03:00
|
|
|
from handler import ContentHandler, ErrorHandler
|
|
|
|
from _exceptions import SAXException, SAXNotRecognizedException, \
|
2000-10-06 14:41:52 -03:00
|
|
|
SAXParseException, SAXNotSupportedException, \
|
|
|
|
SAXReaderNotAvailable
|
2000-09-18 13:31:08 -03:00
|
|
|
|
2000-07-01 01:58:47 -03:00
|
|
|
|
2000-09-24 15:54:49 -03:00
|
|
|
def parse(source, handler, errorHandler=ErrorHandler()):
|
2000-09-24 18:31:06 -03:00
|
|
|
parser = make_parser()
|
2000-09-18 13:31:08 -03:00
|
|
|
parser.setContentHandler(handler)
|
|
|
|
parser.setErrorHandler(errorHandler)
|
2000-09-24 15:54:49 -03:00
|
|
|
parser.parse(source)
|
2000-07-01 01:58:47 -03:00
|
|
|
|
2000-09-18 13:31:08 -03:00
|
|
|
def parseString(string, handler, errorHandler=ErrorHandler()):
|
2000-07-01 01:58:47 -03:00
|
|
|
try:
|
2000-09-18 13:31:08 -03:00
|
|
|
from cStringIO import StringIO
|
2000-07-01 01:58:47 -03:00
|
|
|
except ImportError:
|
2000-09-18 13:31:08 -03:00
|
|
|
from StringIO import StringIO
|
2000-10-23 15:09:50 -03:00
|
|
|
|
2000-09-18 13:31:08 -03:00
|
|
|
if errorHandler is None:
|
|
|
|
errorHandler = ErrorHandler()
|
2000-09-24 18:31:06 -03:00
|
|
|
parser = make_parser()
|
2000-09-18 13:31:08 -03:00
|
|
|
parser.setContentHandler(handler)
|
|
|
|
parser.setErrorHandler(errorHandler)
|
2000-09-24 15:54:49 -03:00
|
|
|
|
|
|
|
inpsrc = InputSource()
|
|
|
|
inpsrc.setByteStream(StringIO(string))
|
|
|
|
parser.parse(inpsrc)
|
2000-09-21 05:34:04 -03:00
|
|
|
|
|
|
|
# this is the parser list used by the make_parser function if no
|
|
|
|
# alternatives are given as parameters to the function
|
|
|
|
|
2006-07-29 13:56:15 -03:00
|
|
|
default_parser_list = ["xml.sax.expatreader"]
|
2000-09-21 05:34:04 -03:00
|
|
|
|
2001-07-31 05:54:55 -03:00
|
|
|
# tell modulefinder that importing sax potentially imports expatreader
|
|
|
|
_false = 0
|
|
|
|
if _false:
|
2006-07-29 13:56:15 -03:00
|
|
|
import xml.sax.expatreader
|
2001-07-31 05:54:55 -03:00
|
|
|
|
2002-05-31 17:46:39 -03:00
|
|
|
import os, sys
|
2000-09-21 05:34:04 -03:00
|
|
|
if os.environ.has_key("PY_SAX_PARSER"):
|
2002-05-31 17:46:39 -03:00
|
|
|
default_parser_list = os.environ["PY_SAX_PARSER"].split(",")
|
2000-09-21 05:34:04 -03:00
|
|
|
del os
|
|
|
|
|
|
|
|
_key = "python.xml.sax.parser"
|
|
|
|
if sys.platform[:4] == "java" and sys.registry.containsKey(_key):
|
2002-05-31 17:46:39 -03:00
|
|
|
default_parser_list = sys.registry.getProperty(_key).split(",")
|
2000-10-23 15:09:50 -03:00
|
|
|
|
|
|
|
|
2000-09-21 05:34:04 -03:00
|
|
|
def make_parser(parser_list = []):
|
|
|
|
"""Creates and returns a SAX parser.
|
|
|
|
|
|
|
|
Creates the first parser it is able to instantiate of the ones
|
|
|
|
given in the list created by doing parser_list +
|
|
|
|
default_parser_list. The lists must contain the names of Python
|
|
|
|
modules containing both a SAX parser and a create_parser function."""
|
|
|
|
|
|
|
|
for parser_name in parser_list + default_parser_list:
|
|
|
|
try:
|
2000-09-22 02:07:56 -03:00
|
|
|
return _create_parser(parser_name)
|
2000-09-21 05:34:04 -03:00
|
|
|
except ImportError,e:
|
2000-10-06 14:41:52 -03:00
|
|
|
import sys
|
|
|
|
if sys.modules.has_key(parser_name):
|
|
|
|
# The parser module was found, but importing it
|
|
|
|
# failed unexpectedly, pass this exception through
|
|
|
|
raise
|
|
|
|
except SAXReaderNotAvailable:
|
|
|
|
# The parser module detected that it won't work properly,
|
|
|
|
# so try the next one
|
2000-09-21 05:34:04 -03:00
|
|
|
pass
|
|
|
|
|
2000-10-23 15:09:50 -03:00
|
|
|
raise SAXReaderNotAvailable("No parsers found", None)
|
|
|
|
|
2000-09-21 05:34:04 -03:00
|
|
|
# --- Internal utility methods used by make_parser
|
|
|
|
|
|
|
|
if sys.platform[ : 4] == "java":
|
|
|
|
def _create_parser(parser_name):
|
2000-09-22 06:30:29 -03:00
|
|
|
from org.python.core import imp
|
|
|
|
drv_module = imp.importName(parser_name, 0, globals())
|
|
|
|
return drv_module.create_parser()
|
2000-09-21 05:34:04 -03:00
|
|
|
|
|
|
|
else:
|
|
|
|
def _create_parser(parser_name):
|
2000-09-24 18:31:06 -03:00
|
|
|
drv_module = __import__(parser_name,{},{},['create_parser'])
|
2000-09-22 06:30:29 -03:00
|
|
|
return drv_module.create_parser()
|
2000-09-21 05:34:04 -03:00
|
|
|
|
|
|
|
del sys
|