d3fbf2e51f
So, Python Markdown is a bottomless pit of horrors, including crippling parsing bugs, random out of nowhere, lack of features. It's definitely much faster, than Pandoc, but Pandoc doesn't go full retard where there's a regex in a fenced code block, that happens to be a regex for markdown elements. Also added some ugly post string replacements to make Pandoc fenced code output work with Prism: instead of the Pandoc <pre class="codelang"><code>, Prism wants <pre><code class="language-codelang>, so I added a regex sub, because it's 00:32.
44 lines
1.1 KiB
Python
44 lines
1.1 KiB
Python
import subprocess
|
|
import logging
|
|
|
|
def pandoc(text):
|
|
# TODO: cache?
|
|
# import hashlib
|
|
# print(hashlib.md5("whatever your string is".encode('utf-8')).hexdigest())
|
|
|
|
""" Pandoc command line call with piped in- and output """
|
|
cmd = (
|
|
'pandoc',
|
|
'-o-',
|
|
'--from=markdown+%s' % (
|
|
'+'.join([
|
|
'footnotes',
|
|
'pipe_tables',
|
|
'raw_html',
|
|
'definition_lists',
|
|
'backtick_code_blocks',
|
|
'fenced_code_attributes',
|
|
'shortcut_reference_links',
|
|
'lists_without_preceding_blankline',
|
|
'autolink_bare_uris',
|
|
])
|
|
),
|
|
'--to=html5',
|
|
'--quiet',
|
|
'--no-highlight'
|
|
)
|
|
p = subprocess.Popen(
|
|
cmd,
|
|
stdin=subprocess.PIPE,
|
|
stdout=subprocess.PIPE,
|
|
stderr=subprocess.PIPE,
|
|
)
|
|
|
|
stdout, stderr = p.communicate(input=text.encode())
|
|
if stderr:
|
|
logging.warning(
|
|
"Error during pandoc covert:\n\t%s\n\t%s",
|
|
cmd,
|
|
stderr
|
|
)
|
|
return stdout.decode('utf-8').strip()
|