2000-05-08 14:31:04 -03:00
|
|
|
"""A readline()-style interface to the parts of a multipart message.
|
|
|
|
|
|
|
|
The MultiFile class makes each part of a multipart message "feel" like
|
|
|
|
an ordinary file, as long as you use fp.readline(). Allows recursive
|
|
|
|
use, for nested multipart messages. Probably best used together
|
|
|
|
with module mimetools.
|
|
|
|
|
|
|
|
Suggested use:
|
|
|
|
|
|
|
|
real_fp = open(...)
|
|
|
|
fp = MultiFile(real_fp)
|
|
|
|
|
|
|
|
"read some lines from fp"
|
|
|
|
fp.push(separator)
|
|
|
|
while 1:
|
|
|
|
"read lines from fp until it returns an empty string" (A)
|
|
|
|
if not fp.next(): break
|
|
|
|
fp.pop()
|
|
|
|
"read remaining lines from fp until it returns an empty string"
|
|
|
|
|
|
|
|
The latter sequence may be used recursively at (A).
|
|
|
|
It is also allowed to use multiple push()...pop() sequences.
|
|
|
|
|
2000-07-16 09:04:32 -03:00
|
|
|
If seekable is given as 0, the class code will not do the bookkeeping
|
2000-05-08 14:31:04 -03:00
|
|
|
it normally attempts in order to make seeks relative to the beginning of the
|
|
|
|
current file part. This may be useful when using MultiFile with a non-
|
|
|
|
seekable stream object.
|
|
|
|
"""
|
1996-07-22 12:23:25 -03:00
|
|
|
|
|
|
|
import sys
|
|
|
|
import string
|
|
|
|
|
|
|
|
Error = 'multifile.Error'
|
|
|
|
|
|
|
|
class MultiFile:
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-08-11 23:38:11 -03:00
|
|
|
seekable = 0
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-08-11 23:38:11 -03:00
|
|
|
def __init__(self, fp, seekable=1):
|
1996-07-22 12:23:25 -03:00
|
|
|
self.fp = fp
|
|
|
|
self.stack = [] # Grows down
|
|
|
|
self.level = 0
|
|
|
|
self.last = 0
|
1998-08-11 23:38:11 -03:00
|
|
|
if seekable:
|
|
|
|
self.seekable = 1
|
|
|
|
self.start = self.fp.tell()
|
|
|
|
self.posstack = [] # Grows down
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def tell(self):
|
|
|
|
if self.level > 0:
|
|
|
|
return self.lastpos
|
|
|
|
return self.fp.tell() - self.start
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-03-26 18:14:20 -04:00
|
|
|
def seek(self, pos, whence=0):
|
|
|
|
here = self.tell()
|
|
|
|
if whence:
|
|
|
|
if whence == 1:
|
|
|
|
pos = pos + here
|
|
|
|
elif whence == 2:
|
|
|
|
if self.level > 0:
|
|
|
|
pos = pos + self.lastpos
|
|
|
|
else:
|
|
|
|
raise Error, "can't use whence=2 yet"
|
|
|
|
if not 0 <= pos <= here or \
|
1996-07-22 12:23:25 -03:00
|
|
|
self.level > 0 and pos > self.lastpos:
|
|
|
|
raise Error, 'bad MultiFile.seek() call'
|
|
|
|
self.fp.seek(pos + self.start)
|
|
|
|
self.level = 0
|
|
|
|
self.last = 0
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def readline(self):
|
1998-08-11 23:38:11 -03:00
|
|
|
if self.level > 0:
|
|
|
|
return ''
|
1996-07-22 12:23:25 -03:00
|
|
|
line = self.fp.readline()
|
1998-08-11 23:38:11 -03:00
|
|
|
# Real EOF?
|
1996-07-22 12:23:25 -03:00
|
|
|
if not line:
|
|
|
|
self.level = len(self.stack)
|
|
|
|
self.last = (self.level > 0)
|
|
|
|
if self.last:
|
1998-08-11 23:38:11 -03:00
|
|
|
raise Error, 'sudden EOF in MultiFile.readline()'
|
1996-07-22 12:23:25 -03:00
|
|
|
return ''
|
1998-08-11 23:38:11 -03:00
|
|
|
assert self.level == 0
|
|
|
|
# Fast check to see if this is just data
|
|
|
|
if self.is_data(line):
|
|
|
|
return line
|
|
|
|
else:
|
|
|
|
# Ignore trailing whitespace on marker lines
|
|
|
|
k = len(line) - 1;
|
|
|
|
while line[k] in string.whitespace:
|
|
|
|
k = k - 1
|
|
|
|
marker = line[:k+1]
|
|
|
|
# No? OK, try to match a boundary.
|
|
|
|
# Return the line (unstripped) if we don't.
|
1996-07-22 12:23:25 -03:00
|
|
|
for i in range(len(self.stack)):
|
|
|
|
sep = self.stack[i]
|
1998-08-11 23:38:11 -03:00
|
|
|
if marker == self.section_divider(sep):
|
1996-07-22 12:23:25 -03:00
|
|
|
self.last = 0
|
|
|
|
break
|
1998-08-11 23:38:11 -03:00
|
|
|
elif marker == self.end_marker(sep):
|
1996-07-22 12:23:25 -03:00
|
|
|
self.last = 1
|
|
|
|
break
|
|
|
|
else:
|
|
|
|
return line
|
1998-08-11 23:38:11 -03:00
|
|
|
# We only get here if we see a section divider or EOM line
|
|
|
|
if self.seekable:
|
|
|
|
self.lastpos = self.tell() - len(line)
|
1996-07-22 12:23:25 -03:00
|
|
|
self.level = i+1
|
|
|
|
if self.level > 1:
|
1998-08-11 23:38:11 -03:00
|
|
|
raise Error,'Missing endmarker in MultiFile.readline()'
|
1996-07-22 12:23:25 -03:00
|
|
|
return ''
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def readlines(self):
|
|
|
|
list = []
|
|
|
|
while 1:
|
|
|
|
line = self.readline()
|
|
|
|
if not line: break
|
|
|
|
list.append(line)
|
|
|
|
return list
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def read(self): # Note: no size argument -- read until EOF only!
|
|
|
|
return string.joinfields(self.readlines(), '')
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def next(self):
|
|
|
|
while self.readline(): pass
|
|
|
|
if self.level > 1 or self.last:
|
|
|
|
return 0
|
|
|
|
self.level = 0
|
|
|
|
self.last = 0
|
1998-08-11 23:38:11 -03:00
|
|
|
if self.seekable:
|
|
|
|
self.start = self.fp.tell()
|
1996-07-22 12:23:25 -03:00
|
|
|
return 1
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def push(self, sep):
|
|
|
|
if self.level > 0:
|
|
|
|
raise Error, 'bad MultiFile.push() call'
|
|
|
|
self.stack.insert(0, sep)
|
1998-08-11 23:38:11 -03:00
|
|
|
if self.seekable:
|
|
|
|
self.posstack.insert(0, self.start)
|
|
|
|
self.start = self.fp.tell()
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1996-07-22 12:23:25 -03:00
|
|
|
def pop(self):
|
|
|
|
if self.stack == []:
|
|
|
|
raise Error, 'bad MultiFile.pop() call'
|
|
|
|
if self.level <= 1:
|
|
|
|
self.last = 0
|
|
|
|
else:
|
|
|
|
abslastpos = self.lastpos + self.start
|
|
|
|
self.level = max(0, self.level - 1)
|
|
|
|
del self.stack[0]
|
1998-08-11 23:38:11 -03:00
|
|
|
if self.seekable:
|
|
|
|
self.start = self.posstack[0]
|
|
|
|
del self.posstack[0]
|
|
|
|
if self.level > 0:
|
|
|
|
self.lastpos = abslastpos - self.start
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-08-11 23:38:11 -03:00
|
|
|
def is_data(self, line):
|
|
|
|
return line[:2] <> '--'
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-08-11 23:38:11 -03:00
|
|
|
def section_divider(self, str):
|
|
|
|
return "--" + str
|
2000-05-08 14:31:04 -03:00
|
|
|
|
1998-08-11 23:38:11 -03:00
|
|
|
def end_marker(self, str):
|
|
|
|
return "--" + str + "--"
|