Kaydet (Commit) 5da60397 authored tarafından Raymond Hettinger's avatar Raymond Hettinger

Refactor to isolate HTML encoding step from the parsing step.

üst 3575f910
...@@ -10,24 +10,23 @@ def is_builtin(s): ...@@ -10,24 +10,23 @@ def is_builtin(s):
'Return True if s is the name of a builtin' 'Return True if s is the name of a builtin'
return s in vars(__builtins__) return s in vars(__builtins__)
def escape_range(lines, start, end): def combine_range(lines, start, end):
'Return escaped content from a range of lines between start and end' 'Join content from a range of lines between start and end'
(srow, scol), (erow, ecol) = start, end (srow, scol), (erow, ecol) = start, end
if srow == erow: if srow == erow:
rows = [lines[srow-1][scol:ecol]] rows = [lines[srow-1][scol:ecol]]
else: else:
rows = [lines[srow-1][scol:]] + lines[srow: erow-1] + [lines[erow-1][:ecol]] rows = [lines[srow-1][scol:]] + lines[srow: erow-1] + [lines[erow-1][:ecol]]
return cgi.escape(''.join(rows)), end return ''.join(rows), end
def colorize(source): def isolate_tokens(source):
'Convert Python source code to an HTML fragment with colorized markup' 'Generate chunks of source and indentify chunks to be highlighted'
lines = source.splitlines(True) lines = source.splitlines(True)
lines.append('') lines.append('')
readline = functools.partial(next, iter(lines), '') readline = functools.partial(next, iter(lines), '')
kind = tok_str = '' kind = tok_str = ''
tok_type = tokenize.COMMENT tok_type = tokenize.COMMENT
written = (1, 0) written = (1, 0)
result = []
for tok in tokenize.generate_tokens(readline): for tok in tokenize.generate_tokens(readline):
prev_tok_type, prev_tok_str = tok_type, tok_str prev_tok_type, prev_tok_str = tok_type, tok_str
tok_type, tok_str, (srow, scol), (erow, ecol), logical_lineno = tok tok_type, tok_str, (srow, scol), (erow, ecol), logical_lineno = tok
...@@ -49,23 +48,29 @@ def colorize(source): ...@@ -49,23 +48,29 @@ def colorize(source):
kind = 'keyword' kind = 'keyword'
elif is_builtin(tok_str) and prev_tok_str != '.': elif is_builtin(tok_str) and prev_tok_str != '.':
kind = 'builtin' kind = 'builtin'
line_upto_token, written = combine_range(lines, written, (srow, scol))
line_thru_token, written = combine_range(lines, written, (erow, ecol))
yield kind, line_upto_token, line_thru_token
def colorize(source):
'Convert Python source code to an HTML fragment with colorized markup'
result = ['<pre class="python">\n']
for kind, line_upto_token, line_thru_token in isolate_tokens(source):
if kind: if kind:
line_upto_token, written = escape_range(lines, written, (srow, scol)) result += [cgi.escape(line_upto_token),
line_thru_token, written = escape_range(lines, written, (erow, ecol)) '<span class="%s">' % kind,
result += [line_upto_token, '<span class="%s">' % kind, cgi.escape(line_thru_token),
line_thru_token, '</span>'] '</span>']
else: else:
line_thru_token, written = escape_range(lines, written, (erow, ecol)) result += [cgi.escape(line_upto_token),
result += [line_thru_token] cgi.escape(line_thru_token)]
result += ['</pre>\n']
result.insert(0, '<pre class="python">\n')
result.append('</pre>\n')
return ''.join(result) return ''.join(result)
default_css = { default_css = {
'.comment': '{color: crimson;}', '.comment': '{color: crimson;}',
'.string': '{color: forestgreen;}', '.string': '{color: forestgreen;}',
'.docstring': '{color: forestgreen; font-style:italic}', '.docstring': '{color: forestgreen; font-style:italic;}',
'.keyword': '{color: darkorange;}', '.keyword': '{color: darkorange;}',
'.builtin': '{color: purple;}', '.builtin': '{color: purple;}',
'.definition': '{color: darkorange; font-weight:bold;}', '.definition': '{color: darkorange; font-weight:bold;}',
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment