Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import docx
from docx.document import Document
from docx.oxml.table import CT_Tbl
from docx.oxml.text.paragraph import CT_P
from docx.table import _Cell, Table
from docx.text.paragraph import Paragraph
def iter_block_items(parent):
    """Yield the paragraphs and tables that are direct children of *parent*.

    Items are produced in the order ``iterchildren()`` returns them, so
    paragraphs and tables come out interleaved rather than grouped by type.

    Args:
        parent: A ``Document`` (its body element is walked) or a table
            ``_Cell`` (its ``_tc`` element is walked).

    Yields:
        A ``Paragraph`` for each ``CT_P`` child and a ``Table`` for each
        ``CT_Tbl`` child, each constructed with *parent* as its parent.
        Children of any other element type are skipped.

    Raises:
        ValueError: If *parent* is neither a ``Document`` nor a ``_Cell``.
            Because this is a generator, the error surfaces on the first
            iteration rather than at call time.
    """
    # Pick the XML element whose children are the block-level items.
    if isinstance(parent, _Cell):
        container = parent._tc
    elif isinstance(parent, Document):
        container = parent.element.body
    else:
        raise ValueError("something's not right")

    for element in container.iterchildren():
        if isinstance(element, CT_Tbl):
            yield Table(element, parent)
        elif isinstance(element, CT_P):
            yield Paragraph(element, parent)
# Open the file through the package-level ``docx.Document`` factory. The
# ``Document`` name imported from ``docx.document`` is the proxy class, whose
# constructor takes an XML element and a part, so passing it a path fails.
doc = docx.Document('doc1.docx')
# Materialize the generator so the block items can be indexed and reused.
result = list(iter_block_items(doc))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement