Files
api/path/to/venv/lib/python3.12/site-packages/mammoth/raw_text.py
2025-12-30 11:27:14 +07:00

15 lines
435 B
Python

from . import documents
def extract_raw_text_from_element(element):
    """Return the plain text held by *element* and everything nested in it.

    ``documents.Text`` nodes yield their ``value`` and ``documents.Tab``
    nodes yield a tab character.  Any other node yields the concatenated
    text of the items in its ``children`` attribute, visited recursively;
    a node without that attribute contributes an empty string.  When the
    node is a ``documents.Paragraph``, two newlines are appended to its
    text.
    """
    # Leaf cases first: these never descend into children.
    if isinstance(element, documents.Text):
        return element.value
    if isinstance(element, documents.Tab):
        return "\t"

    # Container case: gather the text of each child in order.  A missing
    # ``children`` attribute is treated the same as an empty list.
    pieces = [
        extract_raw_text_from_element(child)
        for child in getattr(element, "children", [])
    ]
    joined = "".join(pieces)

    if isinstance(element, documents.Paragraph):
        joined += "\n\n"
    return joined