e2f87b7d5f
Changes: * Vectors.most_similar returns the top most similar vectors instead only one. * Fixes tag map in Dutch model. * Fix initialization of DocBin with attributes.
78 lines
1.2 KiB
Nix
78 lines
1.2 KiB
Nix
{ lib
|
|
, buildPythonPackage
|
|
, fetchPypi
|
|
, pythonOlder
|
|
, pytest
|
|
, preshed
|
|
, ftfy
|
|
, numpy
|
|
, murmurhash
|
|
, plac
|
|
, ujson
|
|
, dill
|
|
, requests
|
|
, thinc
|
|
, regex
|
|
, cymem
|
|
, pathlib
|
|
, msgpack
|
|
, msgpack-numpy
|
|
, jsonschema
|
|
, blis
|
|
, wasabi
|
|
, srsly
|
|
, setuptools
|
|
}:
|
|
|
|
buildPythonPackage rec {
|
|
pname = "spacy";
|
|
version = "2.2.1";
|
|
|
|
src = fetchPypi {
|
|
inherit pname version;
|
|
sha256 = "1a833dx8i4s106fk42x4dnayaq5p3qxaxnc012xij991i09v2pxn";
|
|
};
|
|
|
|
prePatch = ''
|
|
substituteInPlace setup.cfg \
|
|
--replace "plac<1.0.0,>=0.9.6" "plac>=0.9.6"
|
|
'';
|
|
|
|
propagatedBuildInputs = [
|
|
numpy
|
|
murmurhash
|
|
cymem
|
|
preshed
|
|
thinc
|
|
plac
|
|
ujson
|
|
dill
|
|
requests
|
|
regex
|
|
ftfy
|
|
msgpack
|
|
msgpack-numpy
|
|
jsonschema
|
|
blis
|
|
wasabi
|
|
srsly
|
|
setuptools
|
|
] ++ lib.optional (pythonOlder "3.4") pathlib;
|
|
|
|
checkInputs = [
|
|
pytest
|
|
];
|
|
|
|
doCheck = false;
|
|
# checkPhase = ''
|
|
# ${python.interpreter} -m pytest spacy/tests --vectors --models --slow
|
|
# '';
|
|
|
|
meta = with lib; {
|
|
description = "Industrial-strength Natural Language Processing (NLP) with Python and Cython";
|
|
homepage = https://github.com/explosion/spaCy;
|
|
license = licenses.mit;
|
|
maintainers = with maintainers; [ danieldk sdll ];
|
|
};
|
|
}
|