225 lines
7.5 KiB
Python
225 lines
7.5 KiB
Python
#!/usr/bin/python
|
|
|
|
"""
CodeHilite Extension for Python-Markdown
========================================

Adds code/syntax highlighting to standard Python-Markdown code blocks.

Copyright 2006-2008 [Waylan Limberg](http://achinghead.com/).

Project website: <http://www.freewisdom.org/project/python-markdown/CodeHilite>
Contact: markdown@freewisdom.org

License: BSD (see ../docs/LICENSE for details)

Dependencies:
* [Python 2.3+](http://python.org/)
* [Markdown 2.0+](http://www.freewisdom.org/projects/python-markdown/)
* [Pygments](http://pygments.org/)

"""
|
|
|
|
import markdown
|
|
|
|
# --------------- CONSTANTS YOU MIGHT WANT TO MODIFY -----------------
|
|
|
|
# Number of spaces a tab expands to. Use the value exposed by the markdown
# package when it has one, otherwise fall back to 4.
TAB_LENGTH = getattr(markdown, 'TAB_LENGTH', 4)
|
|
|
|
|
|
# ------------------ The Main CodeHilite Class ----------------------
|
|
class CodeHilite:
    """
    Determine language of source code, and pass it into the pygments hilighter.

    Basic Usage:
        >>> code = CodeHilite(src = 'some text')
        >>> html = code.hilite()

    * src: Source string to highlight. ``None`` is treated as an empty
      string when ``hilite()`` is called.

    * linenos: (Boolean) Turn line numbering 'on' or 'off' (off by default).

    * css_class: Set class name of wrapper div ('codehilite' by default).

    Low Level Usage:
        >>> code = CodeHilite()
        >>> code.src = 'some text' # The source string.
        >>> code.linenos = True  # True or False; Turns line numbering on or off.
        >>> html = code.hilite()

    """

    def __init__(self, src=None, linenos=False, css_class="codehilite"):
        self.src = src
        # Language name; filled in by _getLang() from the first source line.
        self.lang = None
        self.linenos = linenos
        self.css_class = css_class

    def hilite(self):
        """
        Pass code to the [Pygments](http://pygments.pocoo.org/) highliter with
        optional line numbers. The output should then be styled with css to
        your liking. No styles are applied by default - only styling hooks
        (i.e.: <span class="k">).

        If Pygments cannot be imported, the source is only HTML-escaped and
        wrapped in a <div>/<pre> (or a numbered list when line numbers are
        on).

        returns : A string of html.

        """
        # An empty source (e.g. the text of an empty element) may arrive
        # as None; treat it as an empty string instead of failing on .strip().
        if self.src is None:
            self.src = ''
        self.src = self.src.strip('\n')

        self._getLang()

        try:
            from pygments import highlight
            from pygments.lexers import get_lexer_by_name, guess_lexer, \
                                        TextLexer
            from pygments.formatters import HtmlFormatter
        except ImportError:
            # just escape and pass through
            txt = self._escape(self.src)
            if self.linenos:
                return self._number(txt)
            return '<div class="%s"><pre>%s</pre></div>\n' % \
                   (self.css_class, txt)

        # Named lexer first, then let Pygments guess, then plain text.
        try:
            lexer = get_lexer_by_name(self.lang)
        except ValueError:
            try:
                lexer = guess_lexer(self.src)
            except ValueError:
                lexer = TextLexer()
        formatter = HtmlFormatter(linenos=self.linenos,
                                  cssclass=self.css_class)
        return highlight(self.src, lexer, formatter)

    def _escape(self, txt):
        """ Basic html escaping of &, <, > and ". """
        # '&' must be handled first so the entities added below are not
        # escaped a second time.
        txt = txt.replace('&', '&amp;')
        txt = txt.replace('<', '&lt;')
        txt = txt.replace('>', '&gt;')
        txt = txt.replace('"', '&quot;')
        return txt

    def _number(self, txt):
        """
        Use <ol> for line numbering.

        `txt` is expected to be HTML-escaped already; each line becomes one
        <li>. Returns the complete wrapper <div> as a string.
        """
        # Fix Whitespace: expand tabs, then alternate non-breaking and
        # regular spaces so that runs of spaces keep their width.
        txt = txt.replace('\t', ' ' * TAB_LENGTH)
        txt = txt.replace(' ' * 4, '&nbsp; &nbsp; ')
        txt = txt.replace(' ' * 3, '&nbsp; &nbsp;')
        txt = txt.replace(' ' * 2, '&nbsp; ')

        # Add line numbers
        items = ['\t<li>%s</li>\n' % line for line in txt.splitlines()]
        return '<div class="%s"><pre><ol>\n%s</ol></pre></div>\n' % \
               (self.css_class, ''.join(items))

    def _getLang(self):
        """
        Determines language of a code block from shebang lines and whether said
        line should be removed or left in place. If the shebang line contains a
        path (even a single /) then it is assumed to be a real shebang line and
        left alone. However, if no path is given (i.e.: #!python or :::python)
        then it is assumed to be a mock shebang for language identification of
        a code fragment and removed from the code block prior to processing for
        code highlighting. When a mock shebang (i.e.: #!python) is found, line
        numbering is turned on. When colons are found in place of a shebang
        (i.e.: :::python), line numbering is left in the current state - off
        by default.

        The marker must be at the very start of the first line. Updates
        self.lang, self.linenos and self.src in place; returns nothing.

        """

        import re

        # split text into lines
        lines = self.src.split("\n")
        # pull first line to examine
        fl = lines.pop(0)

        # Anchored at the start of the line so that a '::' later in ordinary
        # code (e.g. "std::cout") is not mistaken for a language marker.
        c = re.compile(r'''
            ^(?:(?:::+)|(?P<shebang>[#]!))  # Shebang or 2 or more colons.
            (?P<path>(?:/\w+)*[/ ])?        # Zero or 1 path
            (?P<lang>[\w+-]*)               # The language
            ''', re.VERBOSE)
        # search first line for shebang
        m = c.search(fl)
        if m:
            # we have a match; 'lang' always participates (possibly empty)
            self.lang = m.group('lang').lower()
            if m.group('path'):
                # path exists - restore first line
                lines.insert(0, fl)
            if m.group('shebang'):
                # shebang exists - use line numbers
                self.linenos = True
        else:
            # No match
            lines.insert(0, fl)

        self.src = "\n".join(lines).strip("\n")
|
|
|
|
|
|
|
|
# ------------------ The Markdown Extension -------------------------------
|
|
class HiliteTreeprocessor(markdown.treeprocessors.Treeprocessor):
    """ Treeprocessor that highlights the source code held in code blocks. """

    def run(self, root):
        """
        Highlight each <pre> element that wraps exactly one <code> child.

        The generated html is stored in the Markdown instance's htmlStash
        and the <pre> element is turned into a <p> that holds only the
        returned placeholder. `self.config` must have been set by whoever
        created this processor.
        """
        for pre in root.getiterator('pre'):
            kids = pre.getchildren()
            # Only a <pre> with a lone <code> child is a code block.
            if len(kids) != 1 or kids[0].tag != 'code':
                continue

            hiliter = CodeHilite(kids[0].text,
                                 linenos=self.config['force_linenos'][0],
                                 css_class=self.config['css_class'][0])
            stash_key = self.markdown.htmlStash.store(hiliter.hilite(),
                                                      safe=True)

            # Empty the code block in the etree instance, then change it to
            # a p element, which will later be removed when the raw html is
            # inserted.
            pre.clear()
            pre.tag = 'p'
            pre.text = stash_key
|
|
|
|
|
|
class CodeHiliteExtension(markdown.Extension):
    """ Add source code hilighting to markdown codeblocks. """

    def __init__(self, configs):
        """
        Set the default options, then apply the user's overrides.

        * configs: User settings, either as an iterable of (key, value)
          pairs or as a mapping of key to value. None means no overrides.
        """
        # define default configs
        self.config = {
            'force_linenos': [False, "Force line numbers - Default: False"],
            'css_class': ["codehilite",
                          "Set class name for wrapper <div> - Default: codehilite"],
        }

        # Accept a mapping as well as a sequence of pairs; iterating a
        # mapping directly would yield only its keys.
        if configs is None:
            configs = []
        elif hasattr(configs, 'items'):
            configs = configs.items()

        # Override defaults with user settings
        # (setConfig is not defined in this class; presumably inherited
        # from markdown.Extension)
        for key, value in configs:
            self.setConfig(key, value)

    def extendMarkdown(self, md, md_globals):
        """ Add HiliteTreeprocessor to Markdown instance. """
        hiliter = HiliteTreeprocessor(md)
        # The processor reads its options from this shared config dict.
        hiliter.config = self.config
        md.treeprocessors.add("hilite", hiliter, "_begin")
|
|
|
|
|
|
def makeExtension(configs=None):
    """
    Build the CodeHilite extension object.

    * configs: User settings passed straight through to
      CodeHiliteExtension. When omitted, no settings are overridden.
    """
    # None sentinel instead of a shared mutable default argument.
    if configs is None:
        configs = []
    return CodeHiliteExtension(configs=configs)
|
|
|