# Python package requirements in pip requirements-file format: one distribution name per line.
# None of the entries carries a version specifier, so the installer may select any available release.
# NOTE(review): consider pinning or bounding versions for reproducible installs — confirm with maintainers.
#
# Text processing / machine learning — purpose inferred from package names only; TODO confirm against the importing code.
nltk
scikit-learn
# Document parsing (HTML, PDF, DOCX) — presumably; verify against the importing code.
beautifulsoup4
pdfminer.six
python-docx
# NOTE(review): pdfplumber declares its own pdfminer.six dependency; confirm that listing both unpinned stays compatible.
pdfplumber
# Numerical libraries.
numpy
scipy
