Skip to content

Commit

Permalink
feat!: add parent property to tokens (#71)
Browse files Browse the repository at this point in the history
At the same time, we also make the `children`
attribute a _property_. This makes it easier for us
to set the `parent` to every child token, without
having to change much of the existing code.
  • Loading branch information
pbodnar authored Jan 27, 2024
1 parent acde7c2 commit 06f2a93
Show file tree
Hide file tree
Showing 8 changed files with 57 additions and 8 deletions.
4 changes: 4 additions & 0 deletions dev-guide.md
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,10 @@ In this category you will find tokens like `RawText`, `Link`, and `Emphasis`.
Block tokens may have block tokens, span tokens, or no tokens at all as children
in the AST; this depends on the type of token. Span tokens may *only* have span
tokens as children.
Every token has properties called `children` and `parent` that can be used
for traversing the node hierarchy.

### Viewing the AST

In order to see what exactly gets parsed, one can simply use the `AstRenderer`
on a given markdown input, for example:
Expand Down
2 changes: 1 addition & 1 deletion mistletoe/ast_renderer.py
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,7 @@ def get_ast(token):
node[attrname] = getattr(token, attrname)
if 'header' in vars(token):
node['header'] = get_ast(getattr(token, 'header'))
if 'children' in vars(token):
if token.children is not None:
node['children'] = [get_ast(child) for child in token.children]
return node

Expand Down
2 changes: 1 addition & 1 deletion mistletoe/html_renderer.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ def __exit__(self, *args):
super().__exit__(*args)

def render_to_plain(self, token) -> str:
if hasattr(token, 'children'):
if token.children is not None:
inner = [self.render_to_plain(child) for child in token.children]
return ''.join(inner)
return html.escape(token.content)
Expand Down
2 changes: 1 addition & 1 deletion mistletoe/span_token.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,7 +71,7 @@ def __init__(self, match):
self.content = match.group(self.parse_group)

def __contains__(self, text):
if hasattr(self, 'children'):
if self.children is not None:
return any(text in child for child in self.children)
return text in self.content

Expand Down
29 changes: 28 additions & 1 deletion mistletoe/token.py
Original file line number Diff line number Diff line change
@@ -1,3 +1,5 @@
from typing import Iterable, Optional

"""
Base token class.
"""
Expand Down Expand Up @@ -54,7 +56,7 @@ def __repr__(self):
self.__class__.__name__
)

if "children" in vars(self):
if self.children is not None:
count = len(self.children)
if count == 1:
output += " with 1 child"
Expand All @@ -69,3 +71,28 @@ def __repr__(self):
output += " {}={}".format(attrname, _short_repr(attrvalue))
output += " at {:#x}>".format(id(self))
return output

@property
def parent(self) -> Optional['Token']:
    """
    Returns the parent token, if there is any.

    The parent is recorded when this token is assigned to another token's
    ``children``; `None` is returned when no parent has been recorded.
    """
    return getattr(self, '_parent', None)

@property
def children(self) -> Optional[Iterable['Token']]:
    """
    Returns the child (nested) tokens.

    Returns `None` if no children have been assigned, i.e. the token
    is a leaf token.
    """
    return getattr(self, '_children', None)

@children.setter
def children(self, value: Optional[Iterable['Token']]):
    """
    Sets new child (nested) tokens.

    Passed tokens are iterated and their ``parent`` property is set to
    this token. A one-shot iterator (for example a generator) is first
    materialized into a list; any other value is stored as passed.
    """
    if hasattr(value, '__next__'):
        # Iterating a one-shot iterator below would exhaust it and leave
        # ``children`` empty for every later reader, so take a snapshot.
        value = list(value)
    self._children = value
    if value:
        for child in value:
            child._parent = self
4 changes: 2 additions & 2 deletions mistletoe/utils.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,14 +20,14 @@ def traverse(source, klass=None, depth=None, include_source=False):
current_depth = 0
if include_source and (klass is None or isinstance(source, klass)):
yield TraverseResult(source, None, current_depth)
next_children = [(source, c) for c in getattr(source, 'children', [])]
next_children = [(source, c) for c in source.children or []]
while next_children and (depth is None or current_depth < depth):
current_depth += 1
new_children = []
for parent, child in next_children:
if klass is None or isinstance(child, klass):
yield TraverseResult(child, parent, current_depth)
new_children.extend(
[(child, c) for c in getattr(child, 'children', [])]
[(child, c) for c in child.children or []]
)
next_children = new_children
12 changes: 12 additions & 0 deletions test/test_block_token.py
Original file line number Diff line number Diff line change
Expand Up @@ -616,6 +616,18 @@ def test_contains(self):
self.assertFalse('foo' in token)


class TestParent(unittest.TestCase):
    """Checks that block tokens expose their parent after parsing."""

    def test_parent(self):
        """Every child and grandchild of a document points back to its parent."""
        lines = ['# heading\n', '\n', 'paragraph\n']
        token = block_token.Document(lines)
        self.assertEqual(len(token.children), 2)
        self.assertIsNone(token.parent)
        for child in token.children:
            # The parent must be the very same object, not merely an equal one.
            self.assertIs(child.parent, token)
            # Guard against the inner loop passing vacuously.
            self.assertTrue(child.children)
            for grandchild in child.children:
                self.assertIs(grandchild.parent, child)


class TestHtmlBlock(unittest.TestCase):
def setUp(self):
block_token.add_token(block_token.HtmlBlock)
Expand Down
10 changes: 8 additions & 2 deletions test/test_span_token.py
Original file line number Diff line number Diff line change
Expand Up @@ -154,8 +154,7 @@ def test_attribute(self):

def test_no_children(self):
token = span_token.RawText('some text')
with self.assertRaises(AttributeError):
token.children
self.assertIsNone(token.children)

def test_valid_html_entities(self):
tokens = span_token.tokenize_inner('&nbsp; &#21512;')
Expand Down Expand Up @@ -192,6 +191,13 @@ def test_contains(self):
self.assertFalse('foo' in token)


class TestParent(unittest.TestCase):
    """Checks that span tokens expose their parent after parsing."""

    def test_parent(self):
        """The raw text nested in a strong span points back to that span."""
        (token,) = span_token.tokenize_inner('**some text**')
        first_child = token.children[0]
        self.assertIsInstance(first_child, span_token.RawText)
        # The parent must be the very same object, not merely an equal one.
        self.assertIs(first_child.parent, token)


class TestHtmlSpan(unittest.TestCase):
def setUp(self):
span_token.add_token(span_token.HtmlSpan)
Expand Down

0 comments on commit 06f2a93

Please sign in to comment.