2000-02-04 11:28:42 -04:00
|
|
|
"""A lexical analyzer class for simple shell-like syntaxes."""
|
|
|
|
|
2001-01-17 04:48:39 -04:00
|
|
|
# Module and documentation by Eric S. Raymond, 21 Dec 1998
|
2000-05-01 17:08:46 -03:00
|
|
|
# Input stacking and error message cleanup added by ESR, March 2000
|
2001-01-17 04:48:39 -04:00
|
|
|
# push_source() and pop_source() made explicit by ESR, January 2001.
|
2003-04-17 18:31:33 -03:00
|
|
|
# Posix compliance, split(), string arguments, and
|
|
|
|
# iterator interface by Gustavo Niemeyer, April 2003.
|
1998-12-22 01:19:29 -04:00
|
|
|
|
2000-07-03 06:56:23 -03:00
|
|
|
import os.path
|
1999-05-03 15:14:16 -03:00
|
|
|
import sys
|
2004-01-29 02:37:52 -04:00
|
|
|
from collections import deque
|
1998-12-22 01:19:29 -04:00
|
|
|
|
2007-05-17 21:51:22 -03:00
|
|
|
from io import StringIO
|
2003-04-17 18:31:33 -03:00
|
|
|
|
|
|
|
# Public names exported by ``from <module> import *``.
__all__ = ["shlex", "split"]
|
2001-02-15 18:15:14 -04:00
|
|
|
|
1998-12-22 01:19:29 -04:00
|
|
|
class shlex:
    """A lexical analyzer class for simple shell-like syntaxes.

    Characters are consumed one at a time from ``instream`` by
    read_token(); get_token() layers a pushback stack, optional source
    inclusion and end-of-input handling on top of it.  Instances are
    iterators: iterating yields tokens until ``eof`` is produced.

    The lexer is configured through plain instance attributes, which may
    be reassigned after construction:

    commenters        characters that start a comment; the rest of the
                      line is skipped
    wordchars         characters that accumulate into multi-character tokens
    whitespace        characters that separate tokens
    whitespace_split  if true, punctuation is accumulated into words
                      instead of being emitted as separate tokens
    quotes            characters that open and close a quoted string
    escape            escape characters (honoured in POSIX mode only)
    escapedquotes     quote characters inside which ``escape`` is honoured
    source            token that triggers inclusion of another source,
                      or None to disable inclusion
    debug             diagnostic verbosity (0 is silent)
    eof               value returned at end of input: None in POSIX mode,
                      '' otherwise
    """

    def __init__(self, instream=None, infile=None, posix=False):
        """Set up the lexer.

        instream -- a string, or an object providing read() and readline();
            a string is wrapped in a StringIO.  When None, sys.stdin is
            used.
        infile -- name associated with instream; used by error_leader()
            and by sourcehook() to resolve relative paths.  Ignored when
            instream is None.
        posix -- if true, operate in POSIX mode: quotes are stripped from
            tokens, escape characters are honoured, and end of input is
            reported as None rather than ''.
        """
        if isinstance(instream, str):
            instream = StringIO(instream)
        if instream is not None:
            self.instream = instream
            self.infile = infile
        else:
            self.instream = sys.stdin
            self.infile = None
        self.posix = posix
        # In POSIX mode '' is a legitimate token (an empty quoted string),
        # so end of input has to be signalled with a distinct value.
        if posix:
            self.eof = None
        else:
            self.eof = ''
        self.commenters = '#'
        self.wordchars = ('abcdfeghijklmnopqrstuvwxyz'
                          'ABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789_')
        if self.posix:
            self.wordchars += ('ßàáâãäåæçèéêëìíîïðñòóôõöøùúûüýþÿ'
                               'ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖØÙÚÛÜÝÞ')
        self.whitespace = ' \t\r\n'
        self.whitespace_split = False
        self.quotes = '\'"'
        self.escape = '\\'
        self.escapedquotes = '"'
        # Scanner state: ' ' between tokens, 'a' inside a word, a quote
        # character inside a quoted string, an escape character right
        # after an escape, None once end of file has been reached.
        self.state = ' '
        self.pushback = deque()
        self.lineno = 1
        self.debug = 0
        self.token = ''
        self.filestack = deque()
        self.source = None

    def push_token(self, tok):
        "Push a token onto the stack popped by the get_token method"
        if self.debug >= 1:
            print("shlex: pushing token " + repr(tok))
        self.pushback.appendleft(tok)

    def push_source(self, newstream, newfile=None):
        """Push an input source onto the lexer's input source stack.

        newstream -- a string (wrapped in a StringIO) or a stream object.
        newfile -- name to record for the new stream, or None.

        The current (infile, instream, lineno) triple is saved so that
        pop_source() can restore it; line counting restarts at 1.
        """
        if isinstance(newstream, str):
            newstream = StringIO(newstream)
        self.filestack.appendleft((self.infile, self.instream, self.lineno))
        self.infile = newfile
        self.instream = newstream
        self.lineno = 1
        if self.debug:
            if newfile is not None:
                print('shlex: pushing to file %s' % (self.infile,))
            else:
                print('shlex: pushing to stream %s' % (self.instream,))

    def pop_source(self):
        """Pop the input source stack.

        Closes the current stream, restores the most recently saved
        (infile, instream, lineno) triple and resets the scanner to the
        between-tokens state.
        """
        self.instream.close()
        (self.infile, self.instream, self.lineno) = self.filestack.popleft()
        if self.debug:
            print('shlex: popping to %s, line %d'
                  % (self.instream, self.lineno))
        self.state = ' '

    def get_token(self):
        """Get a token from the input stream (or from stack if it's nonempty).

        Tokens queued with push_token() are returned first.  Otherwise a
        token is read with read_token(); if it equals ``self.source`` the
        following token is handed to sourcehook() and the stream it
        returns becomes the current input.  When the current stream is
        exhausted and stacked sources remain, the stream is popped and
        reading continues from the previous one.  Returns ``self.eof``
        when no input is left.
        """
        if self.pushback:
            tok = self.pushback.popleft()
            if self.debug >= 1:
                print("shlex: popping token " + repr(tok))
            return tok
        # No pushback.  Get a token.
        raw = self.read_token()
        # Handle inclusions
        if self.source is not None:
            while raw == self.source:
                spec = self.sourcehook(self.read_token())
                if spec:
                    (newfile, newstream) = spec
                    self.push_source(newstream, newfile)
                raw = self.get_token()
        # Maybe we got EOF instead?
        while raw == self.eof:
            if not self.filestack:
                return self.eof
            else:
                self.pop_source()
                raw = self.get_token()
        # Neither inclusion nor EOF
        if self.debug >= 1:
            if raw != self.eof:
                print("shlex: token=" + repr(raw))
            else:
                print("shlex: token=EOF")
        return raw

    def read_token(self):
        """Read one raw token from the current input stream.

        Runs the character-level state machine until a token is complete
        and returns it.  At end of input returns '' or, in POSIX mode when
        nothing was quoted, None.  Pushback, source inclusion and the
        source stack are not consulted here; see get_token().

        Raises ValueError if input ends inside a quoted string or
        immediately after an escape character.
        """
        # True once a quoted section has been seen, so that an empty
        # quoted string can be told apart from "no token" in POSIX mode.
        quoted = False
        # State to return to after the escaped character is consumed.
        escapedstate = ' '
        while True:
            nextchar = self.instream.read(1)
            if nextchar == '\n':
                self.lineno += 1
            if self.debug >= 3:
                print("shlex: in state", repr(self.state),
                      "I see character:", repr(nextchar))
            if self.state is None:
                self.token = ''        # past end of file
                break
            elif self.state == ' ':
                # Between tokens.
                if not nextchar:
                    self.state = None  # end of file
                    break
                elif nextchar in self.whitespace:
                    if self.debug >= 2:
                        print("shlex: I see whitespace in whitespace state")
                    if self.token or (self.posix and quoted):
                        break   # emit current token
                    else:
                        continue
                elif nextchar in self.commenters:
                    # Discard the rest of the line; the newline swallowed
                    # by readline() never reaches the counter above.
                    self.instream.readline()
                    self.lineno += 1
                elif self.posix and nextchar in self.escape:
                    escapedstate = 'a'
                    self.state = nextchar
                elif nextchar in self.wordchars:
                    self.token = nextchar
                    self.state = 'a'
                elif nextchar in self.quotes:
                    # Non-POSIX mode keeps the quote characters in the token.
                    if not self.posix:
                        self.token = nextchar
                    self.state = nextchar
                elif self.whitespace_split:
                    self.token = nextchar
                    self.state = 'a'
                else:
                    # Punctuation: a single-character token.
                    self.token = nextchar
                    if self.token or (self.posix and quoted):
                        break   # emit current token
                    else:
                        continue
            elif self.state in self.quotes:
                # Inside a quoted string; self.state is the opening quote.
                quoted = True
                if not nextchar:      # end of file
                    if self.debug >= 2:
                        print("shlex: I see EOF in quotes state")
                    # XXX what error should be raised here?
                    raise ValueError("No closing quotation")
                if nextchar == self.state:
                    if not self.posix:
                        self.token += nextchar
                        self.state = ' '
                        break
                    else:
                        # POSIX: the word may continue after the quote.
                        self.state = 'a'
                elif (self.posix and nextchar in self.escape
                      and self.state in self.escapedquotes):
                    escapedstate = self.state
                    self.state = nextchar
                else:
                    self.token += nextchar
            elif self.state in self.escape:
                # Right after an escape character; self.state is that
                # character.
                if not nextchar:      # end of file
                    if self.debug >= 2:
                        print("shlex: I see EOF in escape state")
                    # XXX what error should be raised here?
                    raise ValueError("No escaped character")
                # In posix shells, only the quote itself or the escape
                # character may be escaped within quotes.
                if (escapedstate in self.quotes
                        and nextchar != self.state
                        and nextchar != escapedstate):
                    self.token += self.state
                self.token += nextchar
                self.state = escapedstate
            elif self.state == 'a':
                # Inside a word.
                if not nextchar:
                    self.state = None   # end of file
                    break
                elif nextchar in self.whitespace:
                    if self.debug >= 2:
                        print("shlex: I see whitespace in word state")
                    self.state = ' '
                    if self.token or (self.posix and quoted):
                        break   # emit current token
                    else:
                        continue
                elif nextchar in self.commenters:
                    self.instream.readline()
                    self.lineno += 1
                    if self.posix:
                        self.state = ' '
                        if self.token or (self.posix and quoted):
                            break   # emit current token
                        else:
                            continue
                elif self.posix and nextchar in self.quotes:
                    self.state = nextchar
                elif self.posix and nextchar in self.escape:
                    escapedstate = 'a'
                    self.state = nextchar
                elif (nextchar in self.wordchars or nextchar in self.quotes
                      or self.whitespace_split):
                    self.token += nextchar
                else:
                    # Punctuation ends the word; hand it back so the next
                    # get_token() call returns it as its own token.
                    self.pushback.appendleft(nextchar)
                    if self.debug >= 2:
                        print("shlex: I see punctuation in word state")
                    self.state = ' '
                    # An empty quoted string ('' or "") in POSIX mode is a
                    # real token and must be emitted before the
                    # punctuation, exactly as in the whitespace branch.
                    if self.token or (self.posix and quoted):
                        break   # emit current token
                    else:
                        continue
        result = self.token
        self.token = ''
        if self.posix and not quoted and result == '':
            result = None
        if self.debug > 1:
            if result:
                print("shlex: raw token=" + repr(result))
            else:
                print("shlex: raw token=EOF")
        return result

    def sourcehook(self, newfile):
        """Hook called on a filename to be sourced.

        If *newfile* starts with a double quote, its first and last
        characters are stripped.  A relative name is resolved against the
        directory of ``self.infile`` when that is a string.  Returns a
        (filename, open file object) pair.
        """
        if newfile[0] == '"':
            newfile = newfile[1:-1]
        # This implements cpp-like semantics for relative-path inclusion.
        if isinstance(self.infile, str) and not os.path.isabs(newfile):
            newfile = os.path.join(os.path.dirname(self.infile), newfile)
        return (newfile, open(newfile, "r"))

    def error_leader(self, infile=None, lineno=None):
        """Emit a C-compiler-like, Emacs-friendly error-message leader.

        *infile* and *lineno* default to the lexer's current input name
        and line number.  Returns a string of the form
        '"<infile>", line <lineno>: '.
        """
        if infile is None:
            infile = self.infile
        if lineno is None:
            lineno = self.lineno
        return "\"%s\", line %d: " % (infile, lineno)

    def __iter__(self):
        "Return the lexer itself; it is its own iterator."
        return self

    def __next__(self):
        "Return the next token, raising StopIteration at end of input."
        token = self.get_token()
        if token == self.eof:
            raise StopIteration
        return token
|
|
|
|
|
Merged revisions 55631-55794 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/branches/p3yk
................
r55636 | neal.norwitz | 2007-05-29 00:06:39 -0700 (Tue, 29 May 2007) | 149 lines
Merged revisions 55506-55635 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk
........
r55507 | georg.brandl | 2007-05-22 07:28:17 -0700 (Tue, 22 May 2007) | 2 lines
Remove the "panel" module doc file which has been ignored since 1994.
........
r55522 | mark.hammond | 2007-05-22 19:04:28 -0700 (Tue, 22 May 2007) | 4 lines
Remove definition of PY_UNICODE_TYPE from pyconfig.h, allowing the
definition in unicodeobject.h to be used, giving us the desired
wchar_t in place of 'unsigned short'. As discussed on python-dev.
........
r55525 | neal.norwitz | 2007-05-22 23:35:32 -0700 (Tue, 22 May 2007) | 6 lines
Add -3 option to the interpreter to warn about features that are
deprecated and will be changed/removed in Python 3.0.
This patch is mostly from Anthony. I tweaked some format and added
a little doc.
........
r55527 | neal.norwitz | 2007-05-22 23:57:35 -0700 (Tue, 22 May 2007) | 1 line
Whitespace cleanup
........
r55528 | neal.norwitz | 2007-05-22 23:58:36 -0700 (Tue, 22 May 2007) | 1 line
Add a bunch more deprecation warnings for builtins that are going away in 3.0
........
r55549 | georg.brandl | 2007-05-24 09:49:29 -0700 (Thu, 24 May 2007) | 2 lines
shlex.split() now has an optional "posix" parameter.
........
r55550 | georg.brandl | 2007-05-24 10:33:33 -0700 (Thu, 24 May 2007) | 2 lines
Fix parameter passing.
........
r55555 | facundo.batista | 2007-05-24 10:50:54 -0700 (Thu, 24 May 2007) | 6 lines
Added an optional timeout parameter to urllib.ftpwrapper, with tests
(for this and a basic one, because there weren't any). Changed also
NEWS, but didn't find documentation for this function, assumed it
wasn't public...
........
r55563 | facundo.batista | 2007-05-24 13:01:59 -0700 (Thu, 24 May 2007) | 4 lines
Removed the .recv() in the test, is not necessary, and was
causing problems that didn't have anything to do with was
actually being tested...
........
r55564 | facundo.batista | 2007-05-24 13:51:19 -0700 (Thu, 24 May 2007) | 5 lines
Let's see if reading exactly what is written allow this live
test to pass (now I know why there were so few tests in ftp,
http, etc, :( ).
........
r55567 | facundo.batista | 2007-05-24 20:10:28 -0700 (Thu, 24 May 2007) | 4 lines
Trying to make the tests work in Windows and Solaris, everywhere
else just works
........
r55568 | facundo.batista | 2007-05-24 20:47:19 -0700 (Thu, 24 May 2007) | 4 lines
Fixing stupid error, and introducing a sleep, to see if the
other thread is awakened and finish sending data.
........
r55569 | facundo.batista | 2007-05-24 21:20:22 -0700 (Thu, 24 May 2007) | 4 lines
Commenting out the tests until find out who can test them in
one of the problematic enviroments.
........
r55570 | neal.norwitz | 2007-05-24 22:13:40 -0700 (Thu, 24 May 2007) | 2 lines
Get test passing again by commenting out the reference to the test class.
........
r55575 | vinay.sajip | 2007-05-25 00:05:59 -0700 (Fri, 25 May 2007) | 1 line
Updated docstring for SysLogHandler (#1720726).
........
r55576 | vinay.sajip | 2007-05-25 00:06:55 -0700 (Fri, 25 May 2007) | 1 line
Updated documentation for SysLogHandler (#1720726).
........
r55592 | brett.cannon | 2007-05-25 13:17:15 -0700 (Fri, 25 May 2007) | 3 lines
Remove direct call's to file's constructor and replace them with calls to
open() as ths is considered best practice.
........
r55601 | kristjan.jonsson | 2007-05-26 12:19:50 -0700 (Sat, 26 May 2007) | 1 line
Remove the rgbimgmodule from PCBuild8
........
r55602 | kristjan.jonsson | 2007-05-26 12:31:39 -0700 (Sat, 26 May 2007) | 1 line
Include <windows.h> after python.h, so that WINNT is properly set before windows.h is included. Fixes warnings in PC builds.
........
r55603 | walter.doerwald | 2007-05-26 14:04:13 -0700 (Sat, 26 May 2007) | 2 lines
Fix typo.
........
r55604 | peter.astrand | 2007-05-26 15:18:20 -0700 (Sat, 26 May 2007) | 1 line
Applied patch 1669481, slightly modified: Support close_fds on Win32
........
r55606 | neal.norwitz | 2007-05-26 21:08:54 -0700 (Sat, 26 May 2007) | 2 lines
Add the new function object attribute names from py3k.
........
r55617 | lars.gustaebel | 2007-05-27 12:49:30 -0700 (Sun, 27 May 2007) | 20 lines
Added errors argument to TarFile class that allows the user to
specify an error handling scheme for character conversion. Additional
scheme "utf-8" in read mode. Unicode input filenames are now
supported by design. The values of the pax_headers dictionary are now
limited to unicode objects.
Fixed: The prefix field is no longer used in PAX_FORMAT (in
conformance with POSIX).
Fixed: In read mode use a possible pax header size field.
Fixed: Strip trailing slashes from pax header name values.
Fixed: Give values in user-specified pax_headers precedence when
writing.
Added unicode tests. Added pax/regtype4 member to testtar.tar all
possible number fields in a pax header.
Added two chapters to the documentation about the different formats
tarfile.py supports and how unicode issues are handled.
........
r55618 | raymond.hettinger | 2007-05-27 22:23:22 -0700 (Sun, 27 May 2007) | 1 line
Explain when groupby() issues a new group.
........
r55634 | martin.v.loewis | 2007-05-28 21:01:29 -0700 (Mon, 28 May 2007) | 2 lines
Test pre-commit hook for a link to a .py file.
........
r55635 | martin.v.loewis | 2007-05-28 21:02:03 -0700 (Mon, 28 May 2007) | 2 lines
Revert 55634.
........
................
r55639 | neal.norwitz | 2007-05-29 00:58:11 -0700 (Tue, 29 May 2007) | 1 line
Remove sys.exc_{type,exc_value,exc_traceback}
................
r55641 | neal.norwitz | 2007-05-29 01:03:50 -0700 (Tue, 29 May 2007) | 1 line
Missed one sys.exc_type. I wonder why exc_{value,traceback} were already gone
................
r55642 | neal.norwitz | 2007-05-29 01:08:33 -0700 (Tue, 29 May 2007) | 1 line
Missed more doc for sys.exc_* attrs.
................
r55643 | neal.norwitz | 2007-05-29 01:18:19 -0700 (Tue, 29 May 2007) | 1 line
Remove sys.exc_clear()
................
r55665 | guido.van.rossum | 2007-05-29 19:45:43 -0700 (Tue, 29 May 2007) | 4 lines
Make None, True, False keywords.
We can now also delete all the other places that explicitly forbid
assignment to None, but I'm not going to bother right now.
................
r55666 | guido.van.rossum | 2007-05-29 20:01:51 -0700 (Tue, 29 May 2007) | 3 lines
Found another place that needs check for forbidden names.
Fixed test_syntax.py accordingly (it helped me find that one).
................
r55668 | guido.van.rossum | 2007-05-29 20:41:48 -0700 (Tue, 29 May 2007) | 2 lines
Mark None, True, False as keywords.
................
r55673 | neal.norwitz | 2007-05-29 23:28:25 -0700 (Tue, 29 May 2007) | 3 lines
Get the dis module working on modules again after changing dicts
to not return lists and also new-style classes. Add a test.
................
r55674 | neal.norwitz | 2007-05-29 23:35:45 -0700 (Tue, 29 May 2007) | 1 line
Umm, it helps to add the module that the test uses
................
r55675 | neal.norwitz | 2007-05-29 23:53:05 -0700 (Tue, 29 May 2007) | 4 lines
Try to fix up all the other places that were assigning to True/False.
There's at least one more problem in test.test_xmlrpc. I have other
changes in that file and that should be fixed soon (I hope).
................
r55679 | neal.norwitz | 2007-05-30 00:31:55 -0700 (Wed, 30 May 2007) | 1 line
Fix up another place that was assigning to True/False.
................
r55688 | brett.cannon | 2007-05-30 14:19:47 -0700 (Wed, 30 May 2007) | 2 lines
Ditch MimeWriter.
................
r55692 | brett.cannon | 2007-05-30 14:52:00 -0700 (Wed, 30 May 2007) | 2 lines
Remove the mimify module.
................
r55707 | guido.van.rossum | 2007-05-31 05:08:45 -0700 (Thu, 31 May 2007) | 2 lines
Backport the addition of show_code() to dis.py -- it's too handy.
................
r55708 | guido.van.rossum | 2007-05-31 06:22:57 -0700 (Thu, 31 May 2007) | 7 lines
Fix a fairly long-standing bug in the check for assignment to None (and other
keywords, these days). In 2.5, you could write foo(None=1) without getting
a SyntaxError (although foo()'s definition would have to use **kwds to avoid
getting a runtime error complaining about an unknown keyword of course).
This ought to be backported to 2.5.2 or at least 2.6.
................
r55724 | brett.cannon | 2007-05-31 19:32:41 -0700 (Thu, 31 May 2007) | 2 lines
Remove the cfmfile.
................
r55727 | neal.norwitz | 2007-05-31 22:19:44 -0700 (Thu, 31 May 2007) | 1 line
Remove reload() builtin.
................
r55729 | neal.norwitz | 2007-05-31 22:51:30 -0700 (Thu, 31 May 2007) | 59 lines
Merged revisions 55636-55728 via svnmerge from
svn+ssh://pythondev@svn.python.org/python/trunk
........
r55637 | georg.brandl | 2007-05-29 00:16:47 -0700 (Tue, 29 May 2007) | 2 lines
Fix rst markup.
........
r55638 | neal.norwitz | 2007-05-29 00:51:39 -0700 (Tue, 29 May 2007) | 1 line
Fix typo in doc
........
r55671 | neal.norwitz | 2007-05-29 21:53:41 -0700 (Tue, 29 May 2007) | 1 line
Fix indentation (whitespace only).
........
r55676 | thomas.heller | 2007-05-29 23:58:30 -0700 (Tue, 29 May 2007) | 1 line
Fix compiler warnings.
........
r55677 | thomas.heller | 2007-05-30 00:01:25 -0700 (Wed, 30 May 2007) | 2 lines
Correct the name of a field in the WIN32_FIND_DATAA and WIN32_FIND_DATAW structures.
Closes bug #1726026.
........
r55686 | brett.cannon | 2007-05-30 13:46:26 -0700 (Wed, 30 May 2007) | 2 lines
Have MimeWriter raise a DeprecationWarning as per PEP 4 and its documentation.
........
r55690 | brett.cannon | 2007-05-30 14:48:58 -0700 (Wed, 30 May 2007) | 3 lines
Have mimify raise a DeprecationWarning. The docs and PEP 4 have listed the
module as deprecated for a while.
........
r55696 | brett.cannon | 2007-05-30 15:24:28 -0700 (Wed, 30 May 2007) | 2 lines
Have md5 raise a DeprecationWarning as per PEP 4.
........
r55705 | neal.norwitz | 2007-05-30 21:14:22 -0700 (Wed, 30 May 2007) | 1 line
Add some spaces in the example code.
........
r55716 | brett.cannon | 2007-05-31 12:20:00 -0700 (Thu, 31 May 2007) | 2 lines
Have the sha module raise a DeprecationWarning as specified in PEP 4.
........
r55719 | brett.cannon | 2007-05-31 12:40:42 -0700 (Thu, 31 May 2007) | 2 lines
Cause buildtools to raise a DeprecationWarning.
........
r55721 | brett.cannon | 2007-05-31 13:01:11 -0700 (Thu, 31 May 2007) | 2 lines
Have cfmfile raise a DeprecationWarning as per PEP 4.
........
r55726 | neal.norwitz | 2007-05-31 21:56:47 -0700 (Thu, 31 May 2007) | 1 line
Mail if there is an installation failure.
........
................
r55730 | neal.norwitz | 2007-05-31 23:22:07 -0700 (Thu, 31 May 2007) | 2 lines
Remove the code that was missed in rev 55303.
................
r55738 | neal.norwitz | 2007-06-01 19:10:43 -0700 (Fri, 01 Jun 2007) | 1 line
Fix doc breakage
................
r55741 | neal.norwitz | 2007-06-02 00:41:58 -0700 (Sat, 02 Jun 2007) | 1 line
Remove timing module (plus some remnants of other modules).
................
r55742 | neal.norwitz | 2007-06-02 00:51:44 -0700 (Sat, 02 Jun 2007) | 1 line
Remove posixfile module (plus some remnants of other modules).
................
r55744 | neal.norwitz | 2007-06-02 10:18:56 -0700 (Sat, 02 Jun 2007) | 1 line
Fix doc breakage.
................
r55745 | neal.norwitz | 2007-06-02 11:32:16 -0700 (Sat, 02 Jun 2007) | 1 line
Make a whatsnew 3.0 template.
................
r55754 | neal.norwitz | 2007-06-03 23:24:18 -0700 (Sun, 03 Jun 2007) | 1 line
SF #1730441, os._execvpe raises UnboundLocal due to new try/except semantics
................
r55755 | neal.norwitz | 2007-06-03 23:26:00 -0700 (Sun, 03 Jun 2007) | 1 line
Get rid of extra whitespace
................
r55794 | guido.van.rossum | 2007-06-06 15:29:22 -0700 (Wed, 06 Jun 2007) | 3 lines
Make this compile in GCC 2.96, which does not allow interspersing
declarations and code.
................
2007-06-06 20:52:48 -03:00
|
|
|
def split(s, comments=False, posix=True):
    """Split *s* into a list of tokens using shell-like syntax.

    s -- the text to split, passed straight to the shlex constructor.
    comments -- if false (the default), no character is treated as a
        comment starter; otherwise the lexer's default commenters apply.
    posix -- forwarded to shlex; selects POSIX or non-POSIX parsing.
    """
    tokenizer = shlex(s, posix=posix)
    # Split on whitespace only, so punctuation stays inside words.
    tokenizer.whitespace_split = True
    if not comments:
        tokenizer.commenters = ''
    return [tok for tok in tokenizer]
|
1998-12-22 01:19:29 -04:00
|
|
|
|
2001-01-17 04:48:39 -04:00
|
|
|
if __name__ == '__main__':
    # Command-line driver: print every token of the file named by the
    # first argument, or of standard input when no argument is given.
    if len(sys.argv) == 1:
        stream = filename = None    # shlex then falls back to sys.stdin
    else:
        filename = sys.argv[1]
        stream = open(filename)
    try:
        lexer = shlex(stream, filename)
        while True:
            tt = lexer.get_token()
            # A false token ('' in the default non-POSIX mode) marks EOF.
            if not tt:
                break
            print("Token: " + repr(tt))
    finally:
        # Close the file opened above; sys.stdin is left alone.
        if stream is not None:
            stream.close()
|