b2737d4980
* python3Packages.tensorflow-datasets: init at 4.4.0 * Update pkgs/development/python-modules/tensorflow-datasets/default.nix Co-authored-by: Dmitry Kalinkin <dmitry.kalinkin@gmail.com> Co-authored-by: Samuel Ainsworth <skainsworth@gmail.com> Co-authored-by: Dmitry Kalinkin <dmitry.kalinkin@gmail.com>
142 lines
3.2 KiB
Nix
142 lines
3.2 KiB
Nix
# Package definition for `tensorflow-datasets`, built from the upstream
# `tensorflow/datasets` GitHub repository at the tag matching `version`.
#
# Every name in the argument set below is expected to be supplied by the
# caller (typically via `callPackage`); the list is kept in alphabetical order.
{ apache-beam
, attrs
, beautifulsoup4
, buildPythonPackage
, dill
, dm-tree
, fetchFromGitHub
, ffmpeg
, future
, imagemagick
, importlib-resources
, jinja2
, langdetect
, lib
, matplotlib
, mwparserfromhell
, networkx
, nltk
, numpy
, opencv4
, pandas
, pillow
, promise
, protobuf
, pycocotools
, pydub
, pytestCheckHook
, requests
, scikitimage
, scipy
, six
, tensorflow
, tensorflow-metadata
, termcolor
, tifffile
, tqdm
}:

# `rec` is needed so that `src.rev` can refer to `version`.
buildPythonPackage rec {
  pname = "tensorflow-datasets";
  version = "4.4.0";

  # Sources are fetched from GitHub at tag `v<version>`.
  src = fetchFromGitHub {
    owner = "tensorflow";
    repo = "datasets";
    rev = "v${version}";
    sha256 = "11kbpv54nwr0xf7z5mkj2lmrfqfmcdq8qcpapnqck1kiawr3yad6";
  };

  patches = [
    # addresses https://github.com/tensorflow/datasets/issues/3673
    ./corruptions.patch
  ];

  # Dependencies of the library itself.
  propagatedBuildInputs = [
    attrs
    dill
    dm-tree
    future
    importlib-resources
    numpy
    promise
    protobuf
    requests
    six
    tensorflow-metadata
    termcolor
    tqdm
  ];

  # Smoke test: the top-level module must be importable after installation.
  pythonImportsCheck = [
    "tensorflow_datasets"
  ];

  # Dependencies listed only for the test suite; `pytestCheckHook` drives it.
  # Note that `tensorflow` itself appears here and not in
  # `propagatedBuildInputs`.
  checkInputs = [
    apache-beam
    beautifulsoup4
    ffmpeg
    imagemagick
    jinja2
    langdetect
    matplotlib
    mwparserfromhell
    networkx
    nltk
    opencv4
    pandas
    pillow
    pycocotools
    pydub
    pytestCheckHook
    scikitimage
    scipy
    tensorflow
    tifffile
  ];

  # Test files excluded from the pytest run, grouped by the reason for
  # exclusion.
  disabledTestPaths = [
    # Sandbox violations: network access, filesystem write attempts outside of build dir, ...
    "tensorflow_datasets/core/dataset_builder_test.py"
    "tensorflow_datasets/core/dataset_info_test.py"
    "tensorflow_datasets/core/features/features_test.py"
    "tensorflow_datasets/core/github_api/github_path_test.py"
    "tensorflow_datasets/core/utils/gcs_utils_test.py"
    "tensorflow_datasets/scripts/cli/build_test.py"

    # Requires `pretty_midi` which is not packaged in `nixpkgs`.
    "tensorflow_datasets/audio/groove_test.py"

    # Requires `crepe` which is not packaged in `nixpkgs`.
    "tensorflow_datasets/audio/nsynth_test.py"

    # Requires `gcld3` and `pretty_midi` which are not packaged in `nixpkgs`.
    "tensorflow_datasets/core/lazy_imports_lib_test.py"

    # Requires `tensorflow_io` which is not packaged in `nixpkgs`.
    "tensorflow_datasets/image/lsun_test.py"

    # Fails with `TypeError: Constant constructor takes either 0 or 2 positional arguments`
    # deep in TF AutoGraph. Doesn't reproduce in Docker with Ubuntu 22.04 => might be related
    # to the differences in some of the dependencies?
    "tensorflow_datasets/rl_unplugged/rlu_atari/rlu_atari_test.py"

    # Requires `tensorflow_docs` which is not packaged in `nixpkgs` and the test is for documentation anyway.
    "tensorflow_datasets/scripts/documentation/build_api_docs_test.py"

    # Not a test, should not be executed.
    "tensorflow_datasets/testing/test_utils.py"

    # Require `gcld3` and `nltk.punkt` which are not packaged in `nixpkgs`.
    "tensorflow_datasets/text/c4_test.py"
    "tensorflow_datasets/text/c4_utils_test.py"
  ];

  meta = with lib; {
    description = "Library of datasets ready to use with TensorFlow";
    homepage = "https://www.tensorflow.org/datasets/overview";
    license = licenses.asl20;
    maintainers = with maintainers; [ ndl ];
  };
}