"""A more liberal autolinker Inspired by Django's urlize function. Positive examples: >>> import markdown >>> md = markdown.Markdown(extensions=['urlize']) >>> md.convert('http://example.com/') u'
' >>> md.convert('go to http://example.com') u'go to http://example.com
' >>> md.convert('example.com') u'' >>> md.convert('example.net') u'' >>> md.convert('www.example.us') u'' >>> md.convert('(www.example.us/path/?name=val)') u'(www.example.us/path/?name=val)
' >>> md.convert('go togo to http://example.com now!
' Negative examples: >>> md.convert('del.icio.us') u'del.icio.us
' """ import markdown # Global Vars URLIZE_RE = '(%s)' % '|'.join([ r'<(?:f|ht)tps?://[^>]*>', r'\b(?:f|ht)tps?://[^)<>\s]+[^.,)<>\s]', r'\bwww\.[^)<>\s]+[^.,)<>\s]', r'[^(<\s]+\.(?:com|net|org)\b', ]) class UrlizePattern(markdown.inlinepatterns.Pattern): """ Return a link Element given an autolink (`http://example/com`). """ def handleMatch(self, m): url = m.group(2) if url.startswith('<'): url = url[1:-1] text = url if not url.split('://')[0] in ('http','https','ftp'): if '@' in url and not '/' in url: url = 'mailto:' + url else: url = 'http://' + url el = markdown.util.etree.Element("a") el.set('href', url) el.text = markdown.util.AtomicString(text) return el class UrlizeExtension(markdown.Extension): """ Urlize Extension for Python-Markdown. """ def extendMarkdown(self, md, md_globals): """ Replace autolink with UrlizePattern """ md.inlinePatterns['autolink'] = UrlizePattern(URLIZE_RE, md) def makeExtension(*args, **kwargs): return UrlizeExtension(*args, **kwargs) if __name__ == "__main__": import doctest doctest.testmod()