# Python package dependencies, one pip-style requirement specifier per line.
# Lines without a version operator accept any available release.

# Minimum version 2.3.3; no upper bound.
lxml>=2.3.3
# Any release whose version is 1 or higher; no upper bound.
regex>=1
# Unconstrained: the installer picks the version.
html2text
numpy
scipy
# Pinned to exactly this release.
# NOTE(review): numpy and scipy above are unconstrained while scikit-learn is
# pinned; a fresh install may resolve numpy/scipy releases that this
# scikit-learn version was never built or tested against. Confirm, and
# consider adding upper bounds to numpy/scipy or revisiting this pin.
scikit-learn==0.16.1
