:
# - make script usable as a module
# - use class tags and style sheet instead of
"""
class Parser:
""" Send colored python source.
"""
stylesheet = _STYLESHEET
def __init__(self, raw, out=sys.stdout):
""" Store the source text.
"""
self.raw = raw.expandtabs().strip()
self.out = out
def format(self):
""" Parse and send the colored source.
"""
# store line offsets in self.lines
self.lines = [0, 0]
pos = 0
while 1:
pos = self.raw.find(b'\n', pos) + 1
if not pos: break
self.lines.append(pos)
self.lines.append(len(self.raw))
# parse the source and write it
self.pos = 0
if PY2:
text = cStringIO.StringIO(self.raw)
else:
text = io.BytesIO(self.raw)
self.out.write(makebytes(self.stylesheet))
self.out.write(b'\n')
try:
if PY2:
tokenize.tokenize(text.readline, self)
else:
for a,b,c,d,e in tokenize.tokenize(text.readline):
self(a,b,c,d,e)
except tokenize.TokenError as ex:
msg = ex[0]
line = ex[1][0]
self.out.write("ERROR: %s
%s\n" % (
msg, self.raw[self.lines[line]:]))
except IndentationError as ex:
msg = ex[0]
self.out.write("ERROR: %s
\n" % (msg))
self.out.write(b'\n')
def __call__(self, toktype, toktext, startpos, endpos, line):
""" Token handler.
"""
if 0:
print("type %s %s text %s start %s %s end %s %s
\n" % \
(toktype, token.tok_name[toktype], toktext, \
srow, scol,erow,ecol))
srow, scol = startpos
erow, ecol = endpos
# calculate new positions
oldpos = self.pos
newpos = self.lines[srow] + scol
self.pos = newpos + len(toktext)
# handle newlines
if toktype in [token.NEWLINE, tokenize.NL]:
self.out.write(b'\n')
return
# send the original whitespace, if needed
if newpos > oldpos:
self.out.write(self.raw[oldpos:newpos])
# skip indenting tokens
if toktype in [token.INDENT, token.DEDENT]:
self.pos = newpos
return
# map token type to a color group
if token.LPAR <= toktype and toktype <= token.OP:
toktype = token.OP
elif toktype == token.NAME and keyword.iskeyword(toktext):
toktype = _KEYWORD
css_class = _css_classes.get(toktype, 'text')
# send text
self.out.write(makebytes('' % (css_class,)))
self.out.write(makebytes(cgi.escape(toktext)))
self.out.write(b'')
def colorize_file(file=None, outstream=sys.stdout, standalone=True):
"""Convert a python source file into colorized HTML.
Reads file and writes to outstream (default sys.stdout). file can be a
filename or a file-like object (only the read method is used). If file is
None, act as a filter and read from sys.stdin. If standalone is True
(default), send a complete HTML document with header and footer. Otherwise
only a stylesheet and a section are written.
"""
from os.path import basename
if hasattr(file, 'read'):
sourcefile = file
file = None
try:
filename = basename(file.name)
except:
filename = 'STREAM'
elif file is not None:
try:
sourcefile = open(file, 'rb')
filename = basename(file)
except IOError:
raise SystemExit("File %s unknown." % file)
else:
sourcefile = sys.stdin
filename = 'STDIN'
source = sourcefile.read()
if standalone:
outstream.write(makebytes(_HTML_HEADER % {'title': filename}))
Parser(source, out=outstream).format()
if standalone:
outstream.write(makebytes(_HTML_FOOTER))
if file:
sourcefile.close()
if __name__ == "__main__":
import os
if PY2:
out = sys.stdout
else:
out = sys.stdout.buffer
if os.environ.get('PATH_TRANSLATED'):
filepath = os.environ.get('PATH_TRANSLATED')
print('Content-Type: text/html; charset="iso-8859-1"\n')
colorize_file(filepath, out)
elif len(sys.argv) > 1:
filepath = sys.argv[1]
colorize_file(filepath, out)
else:
colorize_file()