# Python package dependencies, written in pip requirements-file syntax
# (one requirement per line).
#
# Specifier conventions used below:
#   name>=X   - any release at or above X is accepted (lower bound only)
#   name==X   - exactly release X is required
#   name      - no version constraint at all
lxml>=2.3.3
regex>=1
# numpy and scipy carry no version constraint here; the installer picks
# whatever release is compatible with the other requirements.
numpy
scipy
# scikit-learn is the only exact pin in this list.
# NOTE(review): presumably pinned for compatibility with something that is
# sensitive to the scikit-learn version (e.g. serialized models) - confirm
# the reason before loosening or bumping this pin.
scikit-learn==0.23.1
# Both chardet and cchardet are listed, each with its own lower bound.
chardet>=1.0.1
cchardet>=0.3.5
cssselect
six>=1.10.0
html5lib