# Package expression for the Hugging Face `datasets` Python library.
#
# Arguments: `lib`, the `buildPythonPackage` and `fetchFromGitHub` builders,
# and the Python packages listed in `propagatedBuildInputs` below.
# Result: the value returned by `buildPythonPackage` for version 1.4.1.
{ lib
, buildPythonPackage
, fetchFromGitHub
, dill
, filelock
, fsspec
, huggingface-hub
, multiprocess
, numpy
, pandas
, pyarrow
, requests
, tqdm
, xxhash
}:

buildPythonPackage rec {
  pname = "datasets";
  version = "1.4.1";

  # Fetched from the GitHub repository named after `pname`, at the revision
  # named after `version`.
  src = fetchFromGitHub {
    owner = "huggingface";
    repo = pname;
    rev = version;
    hash = "sha256-is8TS84varARWyfeDTbQH0pcYFTk0PcEyK183emB4GE=";
  };

  propagatedBuildInputs = [
    dill
    filelock
    fsspec
    huggingface-hub
    multiprocess
    numpy
    pandas
    pyarrow
    requests
    tqdm
    xxhash
  ];

  # Loosen two requirement strings in setup.py: drop the upper bound on tqdm
  # and turn the exact huggingface_hub pin into a lower bound.
  postPatch = ''
    substituteInPlace setup.py \
      --replace '"tqdm>=4.27,<4.50.0"' '"tqdm>=4.27"' \
      --replace "huggingface_hub==0.0.2" "huggingface_hub>=0.0.2"
  '';

  # Tests require pervasive internet access.
  doCheck = false;

  # Module import will attempt to create a cache directory.
  # NOTE(review): presumably this export is what lets the `pythonImportsCheck`
  # below import the module inside the build sandbox; confirm that the import
  # check runs after the fixup phase in the same shell.
  postFixup = "export HF_MODULES_CACHE=$TMPDIR";

  pythonImportsCheck = [ "datasets" ];

  meta = {
    homepage = "https://github.com/huggingface/datasets";
    description = "Fast, efficient, open-access datasets and evaluation metrics for natural language processing";
    changelog = "https://github.com/huggingface/datasets/releases/tag/${version}";
    license = lib.licenses.asl20;
    platforms = lib.platforms.unix;
    maintainers = with lib.maintainers; [ danieldk ];
  };
}