mirror of
https://github.com/randogoth/md2mu.git
synced 2025-12-22 08:27:09 +00:00
underlines + cleanup
This commit is contained in:
187
md2mu.py
187
md2mu.py
@@ -1,49 +1,146 @@
|
|||||||
import mistune
|
import mistune
|
||||||
|
from mistune import Markdown
|
||||||
|
from mistune.core import BlockState
|
||||||
|
from mistune.util import strip_end
|
||||||
|
from mistune.renderers._list import render_list
|
||||||
|
from mistune.renderers.markdown import MarkdownRenderer
|
||||||
|
from typing import Dict, Any
|
||||||
|
from textwrap import indent
|
||||||
import argparse
|
import argparse
|
||||||
|
import re
|
||||||
|
|
||||||
class Markdown2Micron(mistune.HTMLRenderer):
|
UNDERLINED = r'\b_{1,3}(?=[^\s_])'
|
||||||
def text(self, text) -> str:
|
UNDERLINED_END_RE = {
|
||||||
return text
|
'_': re.compile(r'(?:(?<!\\)(?:\\\\)*\\_|[^\s_])_(?!_)\b'),
|
||||||
def emphasis(self, text: str) -> str:
|
'__': re.compile(r'(?:(?<!\\)(?:\\\\)*\\_|[^\s_])__(?!_)\b'),
|
||||||
return '`*' + text + '`*'
|
'___': re.compile(r'(?:(?<!\\)(?:\\\\)*\\_|[^\s_])___(?!_)\b'),
|
||||||
def strong(self, text: str) -> str:
|
}
|
||||||
return '`!' + text + '`!'
|
|
||||||
def codespan(self, text: str) -> str:
|
def parse_underlined(inline, m, state):
|
||||||
return '`=' + text + '`='
|
print(inline, m, state)
|
||||||
def heading(self, text, level, **attrs) -> str:
|
text = m.group(2)
|
||||||
|
print('rrr')
|
||||||
|
state.append_token({'type': 'underlined', 'raw': text})
|
||||||
|
return m.end()
|
||||||
|
|
||||||
|
def parse_underlined(self, m, state) -> int:
|
||||||
|
print(state)
|
||||||
|
pos = m.end()
|
||||||
|
marker = m.group(0)
|
||||||
|
mlen = len(marker)
|
||||||
|
_end_re = UNDERLINED_END_RE[marker]
|
||||||
|
m1 = _end_re.search(state.src, pos)
|
||||||
|
if not m1:
|
||||||
|
state.append_token({'type': 'text', 'raw': marker})
|
||||||
|
return pos
|
||||||
|
end_pos = m1.end()
|
||||||
|
text = state.src[pos:end_pos-mlen]
|
||||||
|
prec_pos = self.precedence_scan(m, state, end_pos)
|
||||||
|
if prec_pos:
|
||||||
|
return prec_pos
|
||||||
|
new_state = state.copy()
|
||||||
|
new_state.src = text
|
||||||
|
new_state.in_underlined = True
|
||||||
|
state.append_token({
|
||||||
|
'type': 'underlined',
|
||||||
|
'children': self.render(new_state),
|
||||||
|
})
|
||||||
|
return end_pos
|
||||||
|
|
||||||
|
def render_underlined(self, token, state) -> str:
|
||||||
|
return '`_' + self.render_children(token, state) + '`_'
|
||||||
|
|
||||||
|
class Markdown2Micron(MarkdownRenderer):
|
||||||
|
NAME = 'micron'
|
||||||
|
|
||||||
|
def __call__(self, tokens, state: BlockState):
|
||||||
|
out = self.render_tokens(tokens, state)
|
||||||
|
# special handle for line breaks
|
||||||
|
out += '\n\n'.join(self.render_referrences(state)) + '\n'
|
||||||
|
return strip_end(out)
|
||||||
|
|
||||||
|
def render_children(self, token, state: BlockState):
|
||||||
|
children = token['children']
|
||||||
|
return self.render_tokens(children, state)
|
||||||
|
|
||||||
|
def text(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return token['raw']
|
||||||
|
|
||||||
|
def emphasis(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return '`*' + self.render_children(token, state) + '`*'
|
||||||
|
|
||||||
|
def strong(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return '`!' + self.render_children(token, state) + '`!'
|
||||||
|
|
||||||
|
def link(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
label = token.get('label')
|
||||||
|
text = self.render_children(token, state)
|
||||||
|
out = '`[' + text + '`'
|
||||||
|
if label:
|
||||||
|
return out + '`[' + label + '`'
|
||||||
|
attrs = token['attrs']
|
||||||
|
url = attrs['url']
|
||||||
|
if text == url:
|
||||||
|
return '`[' + text + '`'
|
||||||
|
elif 'mailto:' + text == url:
|
||||||
|
return '`[' + text + '`'
|
||||||
|
out += url
|
||||||
|
return out + ']'
|
||||||
|
|
||||||
|
def image(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return self.link(token, state)
|
||||||
|
|
||||||
|
def codespan(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return '`=' + token['raw'] + '`='
|
||||||
|
|
||||||
|
def linebreak(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return ' \n'
|
||||||
|
|
||||||
|
def softbreak(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return '\n'
|
||||||
|
|
||||||
|
def blank_line(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return ''
|
||||||
|
|
||||||
|
def inline_html(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
return ''
|
||||||
|
|
||||||
|
def paragraph(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
text = self.render_children(token, state)
|
||||||
|
return text + '\n\n'
|
||||||
|
|
||||||
|
def heading(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
|
level = token['attrs']['level']
|
||||||
if level > 3:
|
if level > 3:
|
||||||
level = 3
|
level = 3
|
||||||
return '>' * level + text + '\n'
|
marker = '>' * level
|
||||||
def link(self, text: str, url: str, title=None) -> str:
|
text = self.render_children(token, state)
|
||||||
s = self.safe_url(url)
|
return marker + ' ' + text + '\n\n'
|
||||||
if text:
|
def thematic_break(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
s = text + '`' + s
|
return '-\n\n'
|
||||||
return f'`[{s}]'
|
|
||||||
def image(self, text: str, url: str, title=None) -> str:
|
def block_text(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
s = self.safe_url(url)
|
return self.render_children(token, state) + '\n'
|
||||||
if title:
|
|
||||||
s = title + '`' + s
|
def block_code(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
return f'`[{s}]'
|
code = token['raw']
|
||||||
def blank_line(self) -> str:
|
if code and code[-1] != '\n':
|
||||||
return '' + '\n'
|
code += '\n'
|
||||||
def linebreak(self) -> str:
|
marker = '`='
|
||||||
return '\n'
|
return marker + '\n' + code + marker + '\n\n'
|
||||||
def softbreak(self) -> str:
|
|
||||||
return '\n'
|
def block_quote(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
def inline_html(self, html: str) -> str:
|
text = indent(self.render_children(token, state), '>>>>')
|
||||||
return '`=\n' + html + '`=\n'
|
return text + '\n\n'
|
||||||
def thematic_break(self):
|
|
||||||
return '-' + '\n'
|
def block_html(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
def paragraph(self, text):
|
return ''
|
||||||
return text + '\n'
|
|
||||||
def block_quote(self, text: str) -> str:
|
def block_error(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
return '>>>>' + text
|
return ''
|
||||||
def list(self, text: str, ordered: bool, **attrs) -> str:
|
|
||||||
return text + '\n'
|
def list(self, token: Dict[str, Any], state: BlockState) -> str:
|
||||||
def list_item(self, text: str) -> str:
|
return render_list(self, token, state)
|
||||||
return '+ ' + text + '\n'
|
|
||||||
def block_code(self, code: str, info=None) -> str:
|
|
||||||
return '`=\n' + code + '`=\n'
|
|
||||||
|
|
||||||
def main():
|
def main():
|
||||||
|
|
||||||
@@ -55,11 +152,13 @@ def main():
|
|||||||
|
|
||||||
with open(args.md_file, 'r') as mdf:
|
with open(args.md_file, 'r') as mdf:
|
||||||
md_str = mdf.read()
|
md_str = mdf.read()
|
||||||
m2μ = Markdown2Micron()
|
m2μr = Markdown2Micron()
|
||||||
md2micron = mistune.create_markdown(renderer=m2μ)
|
m2μ = Markdown(renderer=m2μr)
|
||||||
|
m2μ.inline.register('underlined', UNDERLINED, parse_underlined, before='emphasis')
|
||||||
|
m2μ.renderer.register('underlined', render_underlined)
|
||||||
|
|
||||||
with open(args.mu_file, 'w') as muf:
|
with open(args.mu_file, 'w') as muf:
|
||||||
md_str = muf.write(md2micron(md_str))
|
md_str = muf.write(m2μ(md_str))
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
main()
|
main()
|
||||||
71
micron.mu
71
micron.mu
@@ -1,11 +1,16 @@
|
|||||||
>h1 Heading 8-)
|
> h1 Heading 8-)
|
||||||
>>h2 Heading
|
|
||||||
>>>h3 Heading
|
|
||||||
>>>h4 Heading
|
|
||||||
>>>h5 Heading
|
|
||||||
>>>h6 Heading
|
|
||||||
|
|
||||||
>>Horizontal Rules
|
>> h2 Heading
|
||||||
|
|
||||||
|
>>> h3 Heading
|
||||||
|
|
||||||
|
>>> h4 Heading
|
||||||
|
|
||||||
|
>>> h5 Heading
|
||||||
|
|
||||||
|
>>> h6 Heading
|
||||||
|
|
||||||
|
>> Horizontal Rules
|
||||||
|
|
||||||
-
|
-
|
||||||
|
|
||||||
@@ -13,43 +18,51 @@
|
|||||||
|
|
||||||
-
|
-
|
||||||
|
|
||||||
>>Emphasis
|
>> Emphasis
|
||||||
|
|
||||||
`!This is bold text`!
|
`!This is bold text`!
|
||||||
`!This is bold text`!
|
`_This is bold text`_
|
||||||
`*This is italic text`*
|
|
||||||
`*This is italic text`*
|
`*This is italic text`*
|
||||||
|
`_This is italic text`_
|
||||||
~~Strikethrough~~
|
~~Strikethrough~~
|
||||||
|
|
||||||
>>Blockquotes
|
>> Blockquotes
|
||||||
|
|
||||||
>>>>Blockquotes can also be nested...
|
>>>>Blockquotes can also be nested...
|
||||||
>>>>by using additional greater-than signs right next to each other...
|
|
||||||
>>>>or with spaces between arrows.
|
|
||||||
|
|
||||||
>>Lists
|
>>>>>>>>by using additional greater-than signs right next to each other...
|
||||||
|
|
||||||
>>>Unordered
|
>>>>>>>>>>>>or with spaces between arrows.
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
>> Lists
|
||||||
|
|
||||||
|
>>> Unordered
|
||||||
|
|
||||||
+ Create a list by starting a line with `=+`=, `=-`=, or `=*`=
|
+ Create a list by starting a line with `=+`=, `=-`=, or `=*`=
|
||||||
|
|
||||||
+ Marker character change forces new list start:
|
- Marker character change forces new list start:
|
||||||
|
|
||||||
+ Ac tristique libero volutpat at
|
* Ac tristique libero volutpat at
|
||||||
|
|
||||||
+ Facilisis in pretium nisl aliquet
|
+ Facilisis in pretium nisl aliquet
|
||||||
|
|
||||||
+ Nulla volutpat aliquam velit
|
- Nulla volutpat aliquam velit
|
||||||
|
|
||||||
+ Very easy
|
+ Very easy
|
||||||
|
|
||||||
>>>Ordered
|
>>> Ordered
|
||||||
|
|
||||||
+ Lorem ipsum dolor sit amet
|
1. Lorem ipsum dolor sit amet
|
||||||
+ Consectetur adipiscing elit
|
2. Consectetur adipiscing elit
|
||||||
+ Integer molestie lorem at massa
|
3. Integer molestie lorem at massa
|
||||||
|
|
||||||
>>Code
|
>> Code
|
||||||
|
|
||||||
Inline `=code`=
|
Inline `=code`=
|
||||||
|
|
||||||
@@ -59,7 +72,9 @@ Indented code
|
|||||||
// Some comments
|
// Some comments
|
||||||
line 1 of code
|
line 1 of code
|
||||||
line 2 of code
|
line 2 of code
|
||||||
line 3 of code`=
|
line 3 of code
|
||||||
|
`=
|
||||||
|
|
||||||
Block code "fences"
|
Block code "fences"
|
||||||
|
|
||||||
`=
|
`=
|
||||||
@@ -76,13 +91,13 @@ var foo = function (bar) {
|
|||||||
console.log(foo(5));
|
console.log(foo(5));
|
||||||
`=
|
`=
|
||||||
|
|
||||||
>>Links
|
>> Links
|
||||||
|
|
||||||
`[link text`http://dev.nodeca.com]
|
`[link text`http://dev.nodeca.com]
|
||||||
|
|
||||||
`[link with title`http://nodeca.github.io/pica/demo/]
|
`[link with title`http://nodeca.github.io/pica/demo/]
|
||||||
|
|
||||||
>>Images
|
>> Images
|
||||||
|
|
||||||
`[https://octodex.github.com/images/minion.png]
|
`[Minion`https://octodex.github.com/images/minion.png]
|
||||||
`[The Stormtroopocat`https://octodex.github.com/images/stormtroopocat.jpg]
|
`[Stormtroopocat`https://octodex.github.com/images/stormtroopocat.jpg]
|
||||||
|
|||||||
Reference in New Issue
Block a user