2017-09-13 01:01:01 +01:00
|
|
|
# Package expression for textacy 0.6.3, built from its PyPI source tarball
# with buildPythonPackage. All inputs are function arguments provided by the
# caller.
{ stdenv, buildPythonPackage, fetchPypi
  # NOTE: isPy27 is accepted but not referenced anywhere in this expression.
, isPy27
  # Python libraries handed on through propagatedBuildInputs.
, cachetools, cld2-cffi, cytoolz, ftfy, ijson, matplotlib, networkx, numpy
, pyemd, pyphen, python-Levenshtein, requests, scikitlearn, scipy, spacy
, tqdm, unidecode
}:

let
  pname = "textacy";
  version = "0.6.3";

  # Dependencies forwarded, in this order, as propagatedBuildInputs.
  runtimeDeps = [
    cachetools
    cld2-cffi
    cytoolz
    ftfy
    ijson
    matplotlib
    networkx
    numpy
    pyemd
    pyphen
    python-Levenshtein
    requests
    scikitlearn
    scipy
    spacy
    tqdm
    unidecode
  ];
in
buildPythonPackage {
  inherit pname version;

  # Source archive is looked up on PyPI by pname/version and pinned by hash.
  src = fetchPypi {
    inherit pname version;
    sha256 = "50402545ac92b1a931c2365e341cb35c4ebe5575525f1dcc5265901ff3895a5f";
  };

  propagatedBuildInputs = runtimeDeps;

  # Rewrite the ftfy requirement string in setup.py from the ">=4.2.0,<5.0.0"
  # range to ">=5.0.0".
  postPatch = ''
    substituteInPlace setup.py \
      --replace "'ftfy>=4.2.0,<5.0.0'," "'ftfy>=5.0.0',"
  '';

  # The test suite wants to download data files, so checks are switched off.
  doCheck = false;

  meta = {
    description = "Higher-level text processing, built on spaCy";
    homepage = "http://textacy.readthedocs.io/";
    license = stdenv.lib.licenses.asl20;
    maintainers = [ stdenv.lib.maintainers.rvl ];
    # Marked broken for two reasons:
    #  - ftfy and jellyfish no longer support python2
    #  - the latest scikitlearn is not supported by this release, see
    #    https://github.com/chartbeat-labs/textacy/issues/260
    broken = true;
  };
}
|