-
-
Notifications
You must be signed in to change notification settings - Fork 125
/
Copy pathraw_text_tests.py
57 lines (37 loc) · 1.35 KB
/
raw_text_tests.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
from mammoth.raw_text import extract_raw_text_from_element
from mammoth import documents
from .testing import assert_equal
def test_text_element_is_converted_to_text_content():
    """Extracting raw text from a Text element yields the string it wraps."""
    assert_equal(
        "Hello.",
        extract_raw_text_from_element(documents.Text("Hello.")),
    )
def test_tab_element_is_converted_to_tab_character():
    """Extracting raw text from a tab element yields a single tab character."""
    tab_node = documents.tab()
    extracted = extract_raw_text_from_element(tab_node)
    assert_equal("\t", extracted)
def test_paragraphs_are_terminated_with_newlines():
    """A paragraph's child texts are joined and followed by two newlines."""
    runs = [documents.Text("Hello "), documents.Text("world.")]
    para = documents.paragraph(children=runs)

    extracted = extract_raw_text_from_element(para)

    assert_equal("Hello world.\n\n", extracted)
def test_children_are_recursively_converted_to_text():
    """Text nested under document -> paragraph is reached by the extractor."""
    fragments = [documents.text("Hello "), documents.text("world.")]
    # NOTE(review): the empty dict is passed as the second positional
    # argument exactly as before -- confirm against documents.paragraph's
    # signature that this is the intended parameter.
    para = documents.paragraph(fragments, {})
    doc = documents.document([para])

    extracted = extract_raw_text_from_element(doc)

    assert_equal("Hello world.\n\n", extracted)
def test_non_text_element_without_children_is_converted_to_empty_string():
    """An element with no `children` attribute extracts to an empty string."""
    childless = documents.line_break
    # Precondition: the fixture must really lack a `children` attribute,
    # otherwise this test would not exercise the childless case.
    assert not hasattr(childless, "children")

    extracted = extract_raw_text_from_element(childless)

    assert_equal("", extracted)