# Prerequisite (run in a shell, not in Python):
#   pip install textract
import textract

# Extract the text content of the PDF at the given path, asking textract to
# use its 'pdfminer' extraction method.
# NOTE(review): textract's documentation describes the result as an encoded
# byte string — confirm, and decode it before treating it as `str`.
text = textract.process('path/to/pdf/file', method='pdfminer')