2000-03-10 19:17:24 -04:00
|
|
|
""" Standard "encodings" Package
|
|
|
|
|
|
|
|
Standard Python encoding modules are stored in this package
|
|
|
|
directory.
|
|
|
|
|
|
|
|
Codec modules must have names corresponding to standard lower-case
|
2002-02-11 13:43:46 -04:00
|
|
|
encoding names with hyphens mapped to underscores, e.g. 'utf-8' is
|
|
|
|
implemented by the module 'utf_8.py'.
|
2000-03-10 19:17:24 -04:00
|
|
|
|
|
|
|
Each codec module must export the following interface:
|
|
|
|
|
|
|
|
* getregentry() -> (encoder, decoder, stream_reader, stream_writer)
|
|
|
|
The getregentry() API must return callable objects which adhere to
|
|
|
|
the Python Codec Interface Standard.
|
|
|
|
|
|
|
|
In addition, a module may optionally also define the following
|
|
|
|
APIs which are then used by the package's codec search function:
|
|
|
|
|
|
|
|
* getaliases() -> sequence of encoding name strings to use as aliases
|
|
|
|
|
2000-12-12 10:45:35 -04:00
|
|
|
Alias names returned by getaliases() must be standard encoding
|
|
|
|
names as defined above (lower-case, hyphens converted to
|
|
|
|
underscores).
|
2000-03-10 19:17:24 -04:00
|
|
|
|
|
|
|
Written by Marc-Andre Lemburg (mal@lemburg.com).
|
|
|
|
|
|
|
|
(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
|
|
|
|
|
|
|
|
"""#"
|
|
|
|
|
2002-02-10 17:36:20 -04:00
|
|
|
import codecs,exceptions
|
2000-03-10 19:17:24 -04:00
|
|
|
|
|
|
|
# Lookup cache used by search_function(): maps the encoding name exactly
# as it was passed in to either the codec registry entry (a 4-tuple) or
# None, which records that no codec module could be imported for it.
_cache = {}
|
2000-03-20 12:36:48 -04:00
|
|
|
# Sentinel used as the default for _cache.get() in search_function().
# None cannot serve as the "not cached yet" marker because None is itself
# stored in _cache for failed lookups; the sentinel is compared by
# identity ("is not"), never by value.
_unknown = '--unknown--'
|
2002-02-10 17:36:20 -04:00
|
|
|
# Passed as the "fromlist" argument of the __import__() calls in
# search_function().
# NOTE(review): per the __import__ documentation a non-empty fromlist
# makes __import__('pkg.mod') return the submodule instead of the
# top-level package -- presumably the reason this is not empty.
_import_tail = ['*']
|
2000-03-10 19:17:24 -04:00
|
|
|
|
2001-09-19 08:52:07 -03:00
|
|
|
class CodecRegistryError(LookupError, SystemError):
    """Error raised when a codec module cannot be registered.

    search_function() raises this when an imported codec module does
    not supply a usable registry entry.  The class derives from both
    LookupError and SystemError, so a handler for either base class
    catches it.
    """
|
|
|
|
|
2000-03-10 19:17:24 -04:00
|
|
|
def search_function(encoding):
    """Codec search function of the encodings package.

    Look up the codec module for *encoding* and return its registry
    entry: a 4-tuple (encoder, decoder, stream_reader, stream_writer)
    of callables.  Return None if no module can be imported for the
    name.  Both results are stored in the module-level _cache, keyed by
    *encoding* as given, so repeated lookups return immediately.

    Module lookup: hyphens in *encoding* are mapped to underscores and
    'encodings.<name>' is imported.  If that fails, the name is
    translated through the aliases.aliases mapping and imported again
    using the default import lookup.

    If the module defines getaliases(), the names it returns are added
    to aliases.aliases, without replacing entries that already exist.

    Raises CodecRegistryError if the module has no getregentry(), if
    getregentry() does not yield exactly four items, or if any of the
    items is not callable.
    """
    # Cache lookup.  None is a valid cached value (a remembered miss),
    # which is why a separate sentinel marks "not cached yet".
    entry = _cache.get(encoding, _unknown)
    if entry is not _unknown:
        return entry

    # Import the module: first look in the encodings package, then
    # retry with the alias-translated name and the default import
    # lookup scheme.
    modname = encoding.replace('-', '_')
    try:
        mod = __import__('encodings.' + modname,
                         globals(), locals(), _import_tail)
    except ImportError:
        # NOTE(review): presumably the package's own aliases module,
        # found through the implicit relative import -- confirm.
        import aliases
        modname = aliases.aliases.get(modname, modname)
        try:
            mod = __import__(modname, globals(), locals(), _import_tail)
        except ImportError:
            mod = None
    if mod is None:
        # Cache misses too, so the failed imports are not repeated.
        _cache[encoding] = None
        return None

    # The fallback import above can pick up any importable module,
    # including ones without a __file__ attribute (e.g. built-in
    # modules).  Read it defensively so that the error reports below
    # raise CodecRegistryError rather than an AttributeError.
    location = getattr(mod, '__file__', 'built-in')

    # Now ask the module for the registry entry.  A missing
    # getregentry() is treated like an entry of the wrong length.
    try:
        entry = tuple(mod.getregentry())
    except AttributeError:
        entry = ()
    if len(entry) != 4:
        raise CodecRegistryError(
            'module "%s" (%s) failed to register'
            % (mod.__name__, location))
    for obj in entry:
        if not callable(obj):
            raise CodecRegistryError(
                'incompatible codecs in module "%s" (%s)'
                % (mod.__name__, location))

    # Cache the codec registry entry
    _cache[encoding] = entry

    # Register its aliases (without overwriting previously registered
    # aliases); getaliases() is optional.
    try:
        codecaliases = mod.getaliases()
    except AttributeError:
        pass
    else:
        import aliases
        for alias in codecaliases:
            if alias not in aliases.aliases:
                aliases.aliases[alias] = modname

    # Return the registry entry
    return entry
|
|
|
|
|
|
|
|
# Register the search_function in the Python codec registry
|
|
|
|
# Module-level side effect: this call runs when the module is imported.
codecs.register(search_function)
|