# Source code for textract.parsers.docx_parser

import docx

from .utils import BaseParser


class Parser(BaseParser):
    """Extract text from docx file using python-docx."""

    def extract(self, filename, **kwargs):
        """Return the text of the paragraphs in ``filename``.

        The file is opened with ``docx.Document`` and the ``text`` of every
        entry in ``document.paragraphs`` is joined with a blank line
        (``'\\n\\n'``) between consecutive paragraphs.

        Args:
            filename: Passed straight to ``docx.Document``.
            **kwargs: Accepted for signature compatibility; not used here.

        Returns:
            A single string containing the paragraph texts separated by
            ``'\\n\\n'``.
        """
        # NOTE(review): only ``document.paragraphs`` is read; text held in
        # other containers (e.g. tables) is presumably not included --
        # confirm against the python-docx documentation.
        document = docx.Document(filename)
        paragraph_texts = [paragraph.text for paragraph in document.paragraphs]
        return '\n\n'.join(paragraph_texts)