nixpkgs/pkgs/development/python-modules/pytorch/default.nix

# Function arguments. The feature toggles default to a CPU-only build without
# OpenMPI; the CUDA/MPI packages default to null and are validated by the
# asserts that follow this argument set.
# NOTE(review): `fetchpatch` is not referenced anywhere in the visible expression.
{ stdenv, lib, fetchFromGitHub, fetchpatch, buildPythonPackage, python,
  # CUDA toggle and the packages that are dereferenced when it is enabled
  cudaSupport ? false, cudatoolkit ? null, cudnn ? null, nccl ? null, magma ? null,
  # exported to the build as USE_MKLDNN / USE_MKLDNN_CBLAS and USE_SYSTEM_NCCL
  mklDnnSupport ? true, useSystemNccl ? true,
  # openmpi is added to propagatedBuildInputs when openMPISupport is true
  openMPISupport ? false, openmpi ? null,
  # exported to the build as BUILD_DOCS
  buildDocs ? false,
  # explicit TORCH_CUDA_ARCH_LIST entries; null selects a built-in list
  # based on the major version of cudatoolkit
  cudaArchList ? null,

  # Native build inputs
  cmake, util-linux, linkFarm, symlinkJoin, which,

  # Build inputs
  numactl,

  # Propagated build inputs
  dataclasses, numpy, pyyaml, cffi, click, typing-extensions,

  # Unit tests
  hypothesis, psutil,

  # virtual pkg that consistently instantiates blas across nixpkgs
  # See https://github.com/NixOS/nixpkgs/pull/83888
  blas,

  # ninja (https://ninja-build.org) must be available to run C++ extensions tests,
  ninja,

  # dependencies for torch.utils.tensorboard
  pillow, six, future, tensorflow-tensorboard, protobuf,

  # Python version predicates: `isPy3k` gates `disabled`, `pythonOlder`
  # decides whether the dataclasses backport is propagated
  isPy3k, pythonOlder }:

# OpenMPI support needs an actual openmpi package.
assert !openMPISupport || openmpi != null;

# assert that everything needed for cuda is present and that the correct cuda versions are used
assert !cudaSupport || cudatoolkit != null;
# `magma` is dereferenced by the sync check below and `nccl` by
# `cudatoolkit_joined`; fail with a plain assertion here instead of an
# opaque null-attribute error further down.
assert !cudaSupport || magma != null;
assert !cudaSupport || nccl != null;
assert cudnn == null || cudatoolkit != null;
assert !cudaSupport || (let majorIs = lib.versions.major cudatoolkit.version;
                        in majorIs == "9" || majorIs == "10" || majorIs == "11");

# confirm that cudatoolkits are sync'd across dependencies
assert !(openMPISupport && cudaSupport) || openmpi.cudatoolkit == cudatoolkit;
assert !cudaSupport || magma.cudatoolkit == cudatoolkit;

let
  # Single tree, named "<cudatoolkit.name>-unsplit", that joins the `out` and
  # `lib` outputs of cudatoolkit with the `dev` and `out` outputs of nccl.
  # It is added to nativeBuildInputs for CUDA builds only.
  cudatoolkit_joined = symlinkJoin {
    name = "${cudatoolkit.name}-unsplit";
    # nccl is here purely for semantic grouping; it could be moved to nativeBuildInputs
    paths = [ cudatoolkit.out cudatoolkit.lib nccl.dev nccl.out ];
  };

  # Give an explicit list of supported architectures for the build. See:
  # - pytorch bug report: https://github.com/pytorch/pytorch/issues/23573
  # - pytorch-1.2.0 build on nixpkgs: https://github.com/NixOS/nixpkgs/pull/65041
  #
  # This list was selected by omitting the TORCH_CUDA_ARCH_LIST parameter,
  # observing the fallback option (which selected all architectures known
  # from cudatoolkit_10_0, pytorch-1.2, and python-3.6), and doing a binary
  # search to find the offending architectures.
  #
  # NOTE: Because of sandboxing, this derivation can't auto-detect the hardware's
  # cuda architecture, so there is also now a problem around new architectures
  # not being supported until explicitly added to this derivation.
  #
  # FIXME: CMake is throwing the following warning on pytorch-1.2:
  #
  # ```
  # CMake Warning at cmake/public/utils.cmake:172 (message):
  #   In the future we will require one to explicitly pass TORCH_CUDA_ARCH_LIST
  #   to cmake instead of implicitly setting it as an env variable.  This will
  #   become a FATAL_ERROR in future version of pytorch.
  # ```
  # If this is causing problems for your build, this derivation may have to strip
  # away the standard `buildPythonPackage` and use the
  # [*Adjust Build Options*](https://github.com/pytorch/pytorch/tree/v1.2.0#adjust-build-options-optional)
  # instructions. This will also add more flexibility around configurations
  # (allowing FBGEMM to be built in pytorch-1.1), and may future proof this
  # derivation.
  # Architectures recorded as broken; kept only as documentation and never referenced.
  brokenArchs = [ "3.0" ];

  # "7.0+PTX" closes the list: cuda 9 reports "undefined architecture
  # compute_75", so 7.0 is taken to be the final cuda-9-compatible architecture.
  cuda9ArchList = [ "3.5" "5.0" "5.2" "6.0" "6.1" "7.0" "7.0+PTX" ];

  # 7.5 was the most recent architecture as of cudatoolkit_10_0 and pytorch-1.2.0.
  cuda10ArchList = cuda9ArchList ++ [ "7.5" "7.5+PTX" ];

  # A caller-supplied `cudaArchList` always wins, and the argument is passed
  # through unchanged (possibly null) when CUDA is disabled. Otherwise the
  # list is chosen from the major version of cudatoolkit.
  final_cudaArchList =
    let
      toolkitMajor = lib.versions.major cudatoolkit.version;
      defaultArchList =
        if toolkitMajor == "9"
        then cuda9ArchList
        # the version assert only admits 9, 10 and 11, so this covers 10 and 11
        else cuda10ArchList;
    in
      if cudaSupport && cudaArchList == null
      then defaultArchList
      else cudaArchList;

  # Normally libcuda.so.1 is provided at runtime by nvidia-x11 via
  # LD_LIBRARY_PATH=/run/opengl-driver/lib.  We only use the stub
  # libcuda.so from cudatoolkit for running tests, so that we don't have
  # to recompile pytorch on every update to nvidia-x11 or the kernel.
  #
  # `cudaStub` exposes cudatoolkit's stub libcuda.so under the name libcuda.so.1.
  cudaStub = linkFarm "cuda-stub" [{
    name = "libcuda.so.1";
    path = "${cudatoolkit}/lib/stubs/libcuda.so";
  }];
  # Environment-assignment prefix for the test command in checkPhase; it is the
  # empty string for non-CUDA builds. The escaped `\${LD_LIBRARY_PATH:+:}`
  # reaches the shell unevaluated and only emits the ':' separator when
  # LD_LIBRARY_PATH is already set and non-empty, which avoids an empty path
  # segment. The trailing space separates the prefix from the command.
  cudaStubEnv = lib.optionalString cudaSupport
    "LD_LIBRARY_PATH=${cudaStub}\${LD_LIBRARY_PATH:+:}$LD_LIBRARY_PATH ";

in buildPythonPackage rec {
  pname = "pytorch";
  # Don't forget to update pytorch-bin to the same version.
  version = "1.7.0";

  # Not available for interpreters where isPy3k is false.
  disabled = !isPy3k;

  # Split outputs; `dev` and `lib` are populated by postInstall.
  outputs = [
    "out"   # output standard python package
    "dev"   # output libtorch headers
    "lib"   # output libtorch libraries
  ];

  # Source is the upstream tag "v<version>".
  src = fetchFromGitHub {
    owner  = "pytorch";
    repo   = "pytorch";
    rev    = "v${version}";
    # submodules are fetched as well, presumably for the vendored third_party sources
    fetchSubmodules = true;
    # must be updated together with `version`
    sha256 = "0hb11m5kvs4nsi5bc9ijnv6k07593p9dw40rcn33s9vspinrcjd4";
  };

  # Darwin-only patch set.
  patches = lib.optionals stdenv.isDarwin [
    # pthreadpool added support for Grand Central Dispatch in April
    # 2020. However, this relies on functionality (DISPATCH_APPLY_AUTO)
    # that is available starting with macOS 10.13. However, our current
    # base is 10.12. Until we upgrade, we can fall back on the older
    # pthread support.
    ./pthreadpool-disable-gcd.diff
  ];

  # The dataclasses module is included with Python >= 3.7. This should
  # be fixed with the next PyTorch release.
  # Until then, setup.py's 'dataclasses' requirement gets an environment
  # marker restricting it to python_version < "3.7".
  postPatch = ''
    substituteInPlace setup.py \
      --replace "'dataclasses'" "'dataclasses; python_version < \"3.7\"'"
  '';

  # CUDA builds only (empty string otherwise):
  # - export the selected architectures as a ';'-separated TORCH_CUDA_ARCH_LIST
  # - compile with the gcc/g++ from `cudatoolkit.cc`, i.e. the compiler
  #   version the CUDA toolkit supports
  # - point CUDNN_INCLUDE_DIR at cudnn's headers when cudnn is provided
  preConfigure = lib.optionalString cudaSupport ''
    export TORCH_CUDA_ARCH_LIST="${lib.strings.concatStringsSep ";" final_cudaArchList}"
    export CC=${cudatoolkit.cc}/bin/gcc CXX=${cudatoolkit.cc}/bin/g++
  '' + lib.optionalString (cudaSupport && cudnn != null) ''
    export CUDNN_INCLUDE_DIR=${cudnn}/include
  '';

  # Use pytorch's custom configurations
  # (cmake is a native build input, but its configure hook is switched off;
  # cmake is driven from preBuild instead).
  dontUseCmakeConfigure = true;

  # Build switches, exported to the build as environment variables.
  BUILD_NAMEDTENSOR = true;
  BUILD_DOCS = buildDocs;

  # MKL is enabled only when the blas wrapper is backed by mkl.
  USE_MKL = blas.implementation == "mkl";

  # Unlike MKL, oneDNN (née MKLDNN) is FOSS, so we enable support for
  # it by default. PyTorch currently uses its own vendored version
  # of oneDNN through Intel iDeep.
  USE_MKLDNN = mklDnnSupport;
  USE_MKLDNN_CBLAS = mklDnnSupport;

  # Before the regular build phase: cap build parallelism at
  # $NIX_BUILD_CORES, run setup.py's cmake-only step, then run cmake on the
  # `build` directory.
  preBuild = ''
    export MAX_JOBS=$NIX_BUILD_CORES
    ${python.interpreter} setup.py build --cmake-only
    ${cmake}/bin/cmake build
  '';

  # For every libcaffe2*.so under $out, rewrite the RPATH: drop its first two
  # entries and put $ORIGIN in front of what remains.
  #
  # `strip2` scopes its IFS override to the single `read` command and keeps its
  # scratch variables local, so a modified field separator cannot leak into the
  # hooks that run after preFixup. Expansions are quoted so paths are passed
  # through as single words.
  preFixup = ''
    function join_by { local IFS="$1"; shift; echo "$*"; }
    function strip2 {
      local -a rpath_entries
      local trimmed_rpath
      IFS=':' read -ra rpath_entries <<< "$(patchelf --print-rpath "$1")"
      trimmed_rpath=$(join_by : "''${rpath_entries[@]:2}")
      patchelf --set-rpath "\$ORIGIN:''${trimmed_rpath}" "$1"
    }
    for f in $(find ''${out} -name 'libcaffe2*.so')
    do
      strip2 "$f"
    done
  '';

  # Override the (weirdly) wrong version set by default. See
  # https://github.com/NixOS/nixpkgs/pull/52437#issuecomment-449718038
  # https://github.com/pytorch/pytorch/blob/v1.0.0/setup.py#L267
  PYTORCH_BUILD_VERSION = version;
  PYTORCH_BUILD_NUMBER = 0;

  # When true, don't build pytorch's third_party NCCL.
  USE_SYSTEM_NCCL=useSystemNccl;

  # Suppress a weird warning in mkl-dnn, part of ideep in pytorch
  # (upstream seems to have fixed this in the wrong place?)
  # https://github.com/intel/mkl-dnn/commit/8134d346cdb7fe1695a2aa55771071d455fae0bc
  # https://github.com/pytorch/pytorch/issues/22346
  #
  # Also of interest: pytorch ignores CXXFLAGS and uses CFLAGS for both C and C++:
  # https://github.com/pytorch/pytorch/blob/v1.2.0/setup.py#L17
  #
  # The flag is only added when the blas implementation is mkl; otherwise the
  # list is empty.
  NIX_CFLAGS_COMPILE = lib.optionals (blas.implementation == "mkl") [ "-Wno-error=array-bounds" ];

  # Build-time tools; the joined CUDA toolkit tree is added for CUDA builds only.
  nativeBuildInputs =
    [ cmake util-linux which ninja ]
    ++ lib.optional cudaSupport cudatoolkit_joined;

  # Always the blas wrapper plus its concrete provider; the CUDA libraries for
  # CUDA builds; numactl on Linux only.
  buildInputs =
    [ blas blas.provider ]
    ++ lib.optionals cudaSupport [ cudnn magma nccl ]
    ++ lib.optional stdenv.isLinux numactl;

  propagatedBuildInputs =
    [ cffi click numpy pyyaml typing-extensions ]
    # the following are required for tensorboard support
    ++ [ pillow six future tensorflow-tensorboard protobuf ]
    ++ lib.optional openMPISupport openmpi
    # the dataclasses module is included with Python >= 3.7, so the backport
    # is only propagated for older interpreters
    ++ lib.optional (pythonOlder "3.7") dataclasses;

  checkInputs = [ hypothesis ninja psutil ];

  # Tests take a long time and may be flaky, so just sanity-check imports
  doCheck = false;
  pythonImportsCheck = [ "torch" ];

  # Test command used when checks are enabled: an optional stub-libcuda
  # environment prefix, then pytorch's test runner with a space-separated
  # list of excluded suites.
  checkPhase =
    let
      excludedSuites = [
        "utils" # utils requires git, which is not allowed in the check phase

        # "dataloader" # psutils correctly finds and triggers multiprocessing, but is too sandboxed to run -- resulting in numerous errors
        # ^^^^^^^^^^^^ NOTE: while test_dataloader does return errors, these are acceptable errors and do not interfere with the build

        # tensorboard has acceptable failures for pytorch 1.3.x due to dependencies on tensorboard-plugins
        (lib.optionalString (lib.versions.majorMinor version == "1.3") "tensorboard")
      ];
      commandWords = [
        cudaStubEnv
        "${python.interpreter} test/run_test.py"
        "--exclude"
        (lib.concatStringsSep " " excludedSuites)
      ];
    in
      lib.concatStringsSep " " commandWords;
  # Populate the split outputs from the installed python package:
  # - $dev receives copies of torch/include and torch/share
  # - the CMake config files copied into $dev are rewritten so that their
  #   library directory references point at $lib/lib
  # - $lib receives a copy of torch/lib
  # The files are copied, not moved, so they also remain in $out.
  postInstall = ''
    mkdir $dev
    cp -r $out/${python.sitePackages}/torch/include $dev/include
    cp -r $out/${python.sitePackages}/torch/share   $dev/share

    # Fix up library paths for split outputs
    substituteInPlace \
      $dev/share/cmake/Torch/TorchConfig.cmake \
      --replace \''${TORCH_INSTALL_PREFIX}/lib "$lib/lib"

    substituteInPlace \
      $dev/share/cmake/Caffe2/Caffe2Targets-release.cmake \
      --replace \''${_IMPORT_PREFIX}/lib "$lib/lib"

    mkdir $lib
    cp -r $out/${python.sitePackages}/torch/lib     $lib/lib
  '';

  # Darwin only (empty string elsewhere): give every dylib in $lib/lib an
  # absolute install name, then rewrite the @rpath/... references between the
  # torch libraries so they point at their absolute locations in $lib/lib.
  #
  # Uses `lib.optionalString` like the rest of this file; `stdenv.lib` is a
  # deprecated alias of `lib`.
  postFixup = lib.optionalString stdenv.isDarwin ''
    for f in $(ls $lib/lib/*.dylib); do
        install_name_tool -id $lib/lib/$(basename $f) $f || true
    done

    install_name_tool -change @rpath/libshm.dylib $lib/lib/libshm.dylib $lib/lib/libtorch_python.dylib
    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libtorch_python.dylib
    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch_python.dylib

    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch.dylib

    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_observers.dylib
    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_observers.dylib

    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_module_test_dynamic.dylib
    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_module_test_dynamic.dylib

    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_detectron_ops.dylib
    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_detectron_ops.dylib

    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libshm.dylib
    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libshm.dylib
  '';


  # Package metadata.
  meta = {
    description = "Open source, prototype-to-production deep learning platform";
    homepage    = "https://pytorch.org/";
    license     = lib.licenses.bsd3;
    # Linux always; Darwin only for builds without CUDA support.
    platforms   = lib.platforms.linux ++ lib.optionals (!cudaSupport) lib.platforms.darwin;
    # tscholak esp. for darwin-related builds
    maintainers = [
      lib.maintainers.teh
      lib.maintainers.thoughtpolice
      lib.maintainers.tscholak
    ];
  };
}
-												python3Packages.pytorch: fixup builds with MKL

- Pass `blas.provider` into `buildInputs`, so that CMake can find the actual
  `mkl` for inspection of its cmake files and headers.

- Add `USE_MKL` correctly when the blas provider is `mkl`.

- Use the MKLDNN and MKLDNN_CBLAS flags by default, since `mkldnn` is FOSS and
  always available.

- Remove a patch for MKL 2019, since we've moved to 2020.

- Add a pythonImportsCheck for "torch" as a basic sanity-check

- Removed some unused variables at the top of the file

											
										
										
											2020-05-03 01:40:27 +01:00
+								{ stdenv, lib, fetchFromGitHub, fetchpatch, buildPythonPackage, python,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  cudaSupport ? false, cudatoolkit ? null, cudnn ? null, nccl ? null, magma ? null,
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  mklDnnSupport ? true, useSystemNccl ? true,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  openMPISupport ? false, openmpi ? null,
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  buildDocs ? false,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  cudaArchList ? null,
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
 								  # Native build inputs
-												utillinux: rename to util-linux

											
										
										
											2020-11-24 15:29:28 +00:00
+								  cmake, util-linux, linkFarm, symlinkJoin, which,
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
 								  # Build inputs
 								  numactl,
 								  # Propagated build inputs
 								  dataclasses, numpy, pyyaml, cffi, click, typing-extensions,
 								  # Unit tests
 								  hypothesis, psutil,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  # virtual pkg that consistently instantiates blas across nixpkgs
 								  # See https://github.com/NixOS/nixpkgs/pull/83888
 								  blas,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  # ninja (https://ninja-build.org) must be available to run C++ extensions tests,
 								  ninja,
 								  # dependencies for torch.utils.tensorboard
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  pillow, six, future, tensorflow-tensorboard, protobuf,
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								  isPy3k, pythonOlder }:
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								assert !openMPISupport || openmpi != null;
 								# assert that everything needed for cuda is present and that the correct cuda versions are used
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								assert !cudaSupport || cudatoolkit != null;
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								assert cudnn == null || cudatoolkit != null;
 								assert !cudaSupport || (let majorIs = lib.versions.major cudatoolkit.version;
-												pytorch: update to use passthru's for checks

This makes the checks a little easier to understand - we can just
check it in the passthru. Also increase major check for cuda 11.

											
										
										
											2020-09-10 20:23:15 +01:00
+								                        in majorIs == "9" || majorIs == "10" || majorIs == "11");
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
 								# confirm that cudatoolkits are sync'd across dependencies
-												pytorch: update to use passthru's for checks

This makes the checks a little easier to understand - we can just
check it in the passthru. Also increase major check for cuda 11.

											
										
										
											2020-09-10 20:23:15 +01:00
+								assert !(openMPISupport && cudaSupport) || openmpi.cudatoolkit == cudatoolkit;
 								assert !cudaSupport || magma.cudatoolkit == cudatoolkit;
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								let
 								  cudatoolkit_joined = symlinkJoin {
 								    name = "${cudatoolkit.name}-unsplit";
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    # nccl is here purely for semantic grouping it could be moved to nativeBuildInputs
 								    paths = [ cudatoolkit.out cudatoolkit.lib nccl.dev nccl.out ];
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								  };
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  # Give an explicit list of supported architectures for the build, See:
 								  # - pytorch bug report: https://github.com/pytorch/pytorch/issues/23573
 								  # - pytorch-1.2.0 build on nixpks: https://github.com/NixOS/nixpkgs/pull/65041
 								  #
 								  # This list was selected by omitting the TORCH_CUDA_ARCH_LIST parameter,
 								  # observing the fallback option (which selected all architectures known
 								  # from cudatoolkit_10_0, pytorch-1.2, and python-3.6), and doing a binary
 								  # searching to find offending architectures.
 								  #
 								  # NOTE: Because of sandboxing, this derivation can't auto-detect the hardware's
 								  # cuda architecture, so there is also now a problem around new architectures
 								  # not being supported until explicitly added to this derivation.
 								  #
 								  # FIXME: CMake is throwing the following warning on python-1.2:
 								  #
 								  # ```
 								  # CMake Warning at cmake/public/utils.cmake:172 (message):
 								  #   In the future we will require one to explicitly pass TORCH_CUDA_ARCH_LIST
 								  #   to cmake instead of implicitly setting it as an env variable.  This will
 								  #   become a FATAL_ERROR in future version of pytorch.
 								  # ```
 								  # If this is causing problems for your build, this derivation may have to strip
 								  # away the standard `buildPythonPackage` and use the
 								  # [*Adjust Build Options*](https://github.com/pytorch/pytorch/tree/v1.2.0#adjust-build-options-optional)
 								  # instructions. This will also add more flexibility around configurations
 								  # (allowing FBGEMM to be built in pytorch-1.1), and may future proof this
 								  # derivation.
 								  brokenArchs = [ "3.0" ]; # this variable is only used as documentation.
 								  cuda9ArchList = [
 								    "3.5"
 								    "5.0"
 								    "5.2"
 								    "6.0"
 								    "6.1"
 								    "7.0"
 								    "7.0+PTX"  # I am getting a "undefined architecture compute_75" on cuda 9
 								               # which leads me to believe this is the final cuda-9-compatible architecture.
 								  ];
 								  cuda10ArchList = cuda9ArchList ++ [
 								    "7.5"
 								    "7.5+PTX"  # < most recent architecture as of cudatoolkit_10_0 and pytorch-1.2.0
 								  ];
 								  final_cudaArchList =
 								    if !cudaSupport || cudaArchList != null
 								    then cudaArchList
 								    else
 								      if lib.versions.major cudatoolkit.version == "9"
 								      then cuda9ArchList
 								      else cuda10ArchList; # the assert above removes any ambiguity here.
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								  # Normally libcuda.so.1 is provided at runtime by nvidia-x11 via
 								  # LD_LIBRARY_PATH=/run/opengl-driver/lib.  We only use the stub
 								  # libcuda.so from cudatoolkit for running tests, so that we don’t have
 								  # to recompile pytorch on every update to nvidia-x11 or the kernel.
 								  cudaStub = linkFarm "cuda-stub" [{
 								    name = "libcuda.so.1";
 								    path = "${cudatoolkit}/lib/stubs/libcuda.so";
 								  }];
 								  cudaStubEnv = lib.optionalString cudaSupport
-												treewide: Fix unsafe concatenation of $LD_LIBRARY_PATH

Naive concatenation of $LD_LIBRARY_PATH can result in an empty
colon-delimited segment; this tells glibc to load libraries from the
current directory, which is definitely wrong, and may be a security
vulnerability if the current directory is untrusted.  (See #67234, for
example.)  Fix this throughout the tree.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2020-01-02 00:29:34 +00:00
+								    "LD_LIBRARY_PATH=${cudaStub}\${LD_LIBRARY_PATH:+:}$LD_LIBRARY_PATH ";
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
 								in buildPythonPackage rec {
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  pname = "pytorch";
-												pytorch-bin: init at 1.6.0

											
										
										
											2020-08-30 10:34:32 +01:00
+								  # Don't forget to update pytorch-bin to the same version.
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								  version = "1.7.0";
-												pytorch-bin: init at 1.6.0

											
										
										
											2020-08-30 10:34:32 +01:00
-												treewide: mark some broken packages as broken

Refs:
e6754980264fe927320d5ff2dbd24ca4fac9a160
1e9cc5b9844ef603fe160e9f671178f96200774f
793a2fe1e8bb886ca2096c5904e1193dc3268b6d
c19cf65261639f749012454932a532aa7c681e4b
f6544d618f30fae0bc4798c4387a8c7c9c047a7c

											
										
										
											2019-10-07 16:20:23 +01:00
+								  disabled = !isPy3k;
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  outputs = [
 								    "out"   # output standard python package
-												python3Packages.pytorch: create separate lib output

At some point pytorch.dev was added to expose the libtorch headers and
libraries to non-Python users of libtorch. However, this output
currently has two disadvantages:

1. An application that compiles against the dev output will also have
   the libtorch header files in its closure. This is not so nice when
   e.g. building Docker images of applications that use libtorch.
2. The dev output has a large transitive closure with many dependencies
   that are not necessary when compiling against libtorch.

This change adds the `lib` output so that applications that only link
against libtorch libraries have a small closure.

Before this change, the libtorch dependency adds 746MiB:

% nix path-info -S `realpath result-dev`
/nix/store/10rmy81bjk628sfpbj2szxlws6brq1xn-python3.8-pytorch-1.5.1-dev   782203848

With this change it is reduced to 196MiB:

% nix path-info -S `realpath result-lib`
/nix/store/bck65lf0z7gdhcf89w1zs5nz333lhgwa-python3.8-pytorch-1.5.1-lib   205865056

											
										
										
											2020-07-07 14:15:46 +01:00
+								    "dev"   # output libtorch headers
 								    "lib"   # output libtorch libraries
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  ];
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  src = fetchFromGitHub {
-												pytorch: 0.1.12 -> 0.2.0

											
										
										
											2017-08-19 02:22:23 +01:00
+								    owner  = "pytorch";
 								    repo   = "pytorch";
 								    rev    = "v${version}";
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								    fetchSubmodules = true;
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								    sha256 = "0hb11m5kvs4nsi5bc9ijnv6k07593p9dw40rcn33s9vspinrcjd4";
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  };
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								  patches = lib.optionals stdenv.isDarwin [
-												python3Packages.pytorch: fix Darwin build by disabling GCD

PyTorch 1.6.0 has updated the vendored pthreadpool library, which has recently
added support for Grand Central Dispatch. Unfortunately, it uses functionality
(DISPATCH_APPLY_AUTO) that is only available since macOS 10.13, whereas we are
still using 10.12 libraries.

We can't directly pass options through to vendored libraries, since the setup.py
script creates/filters the options that are passed to CMake. So, instead, this
adds a small patch that disables the GCD functionality in pthreadpool.

											
										
										
											2020-08-05 19:51:05 +01:00
+								    # pthreadpool added support for Grand Central Dispatch in April
 								    # 2020. However, this relies on functionality (DISPATCH_APPLY_AUTO)
 								    # that is only available starting with macOS 10.13, whereas our current
 								    # base is 10.12. Until we upgrade, we can fall back on the older
 								    # pthread support.
 								    ./pthreadpool-disable-gcd.diff
-												python3Packages.pytorch: fix AArch64 build

aarch64-linux builds fail because of the use of opcodes in QNNPACK
that the GNU assembler does not support. This change cherry-picks an
upstream patch that fixes this. See:

https://github.com/pytorch/pytorch/issues/33124
https://github.com/pytorch/pytorch/pull/40584

											
										
										
											2020-06-30 06:56:38 +01:00
+								  ];
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								  # The dataclasses module is included with Python >= 3.7. This should
 								  # be fixed with the next PyTorch release.
 								  #
 								  # The substitution below rewrites the 'dataclasses' requirement string in
 								  # setup.py so that it carries a `python_version < "3.7"` marker.
 								  postPatch = ''
 								    substituteInPlace setup.py \
 								      --replace "'dataclasses'" "'dataclasses; python_version < \"3.7\"'"
 								  '';
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								  preConfigure = lib.optionalString cudaSupport ''
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    export TORCH_CUDA_ARCH_LIST="${lib.strings.concatStringsSep ";" final_cudaArchList}"
-												pytorch: 0.3.1 -> 0.4.0

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 23:00:50 +01:00
+								    export CC=${cudatoolkit.cc}/bin/gcc CXX=${cudatoolkit.cc}/bin/g++
-												pytorch: 0.2.0 → 0.3.1 with CUDA and cuDNN (#38530)

* pytorch-0.3 with optional cuda and cudnn

* pytorch tests reenabled if compiling without cuda

* pytorch: Conditionalize cudnn dependency on cudaSupport

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Compile with the same GCC version used by CUDA if cudaSupport

Fixes this error:

In file included from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/host_config.h:50:0,
                 from /nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/cuda_runtime.h:78,
                 from <command-line>:0:
/nix/store/gv7w3c71jg627cpcff04yi6kwzpzjyap-cudatoolkit-9.1.85.1/include/crt/host_config.h:121:2: error: #error -- unsupported GNU version! gcc versions later than 6 are not supported!
 #error -- unsupported GNU version! gcc versions later than 6 are not supported!
  ^~~~~

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Build with joined cudatoolkit

Similar to #30058 for TensorFlow.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: 0.3.0 -> 0.3.1

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Patch for “refcounted file mapping not supported” failure

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Skip distributed tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

* pytorch: Use the stub libcuda.so from cudatoolkit for running tests

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2018-05-04 15:19:31 +01:00
+								  '' + lib.optionalString (cudaSupport && cudnn != null) ''
 								    export CUDNN_INCLUDE_DIR=${cudnn}/include
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  '';
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  # Use pytorch's custom configurations
 								  dontUseCmakeConfigure = true;
 								  BUILD_NAMEDTENSOR = true;
 								  BUILD_DOCS = buildDocs;
-												python3Packages.pytorch: fixup builds with MKL

- Pass `blas.provider` into `buildInputs`, so that CMake can find the actual
  `mkl` for inspection of its cmake files and headers.

- Add `USE_MKL` correctly when the blas provider is `mkl`.

- Use the MKLDNN and MKLDNN_CBLAS flags by default, since `mkldnn` is FOSS and
  always available.

- Remove a patch for MKL 2019, since we've moved to 2020.

- Add a pythonImportsCheck for "torch" as a basic sanity-check

- Removed some unused variables at the top of the file

											
										
										
											2020-05-03 01:40:27 +01:00
 								  USE_MKL = blas.implementation == "mkl";
-												python3Packages.pytorch: remove oneDNN dependency

oneDNN was added as a dependency, but it is not actually used by
PyTorch. PyTorch uses oneDNN from the vendored iDeep dependency.

Using a system-provided oneDNN is currently not a supported build
option.

											
										
										
											2020-08-26 09:46:22 +01:00
+								  # Unlike MKL, oneDNN (née MKLDNN) is FOSS, so we enable support for
 								  # it by default. PyTorch currently uses its own vendored version
 								  # of oneDNN through Intel iDeep.
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  USE_MKLDNN = mklDnnSupport;
-												python3Packages.pytorch: fixup builds with MKL

- Pass `blas.provider` into `buildInputs`, so that CMake can find the actual
  `mkl` for inspection of its cmake files and headers.

- Add `USE_MKL` correctly when the blas provider is `mkl`.

- Use the MKLDNN and MKLDNN_CBLAS flags by default, since `mkldnn` is FOSS and
  always available.

- Remove a patch for MKL 2019, since we've moved to 2020.

- Add a pythonImportsCheck for "torch" as a basic sanity-check

- Removed some unused variables at the top of the file

											
										
										
											2020-05-03 01:40:27 +01:00
+								  USE_MKLDNN_CBLAS = mklDnnSupport;
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
 								  # Runs before the build phase:
 								  #   1. export MAX_JOBS from the core count provided in NIX_BUILD_CORES;
 								  #   2. call setup.py with `build --cmake-only`;
 								  #   3. invoke cmake on the `build` directory.
 								  # NOTE(review): presumably step 2 stops after generating the CMake build
 								  # tree and step 3 re-runs configuration on it -- confirm against
 								  # upstream's setup.py.
+								  preBuild = ''
 								    export MAX_JOBS=$NIX_BUILD_CORES
 								    ${python.interpreter} setup.py build --cmake-only
 								    ${cmake}/bin/cmake build
 								  '';
-												pytorch-0.4 rpath fix, some tests reenabled

											
										
										
											2018-09-12 08:22:52 +01:00
+								  preFixup = ''
 								    function join_by { local IFS="$1"; shift; echo "$*"; }
 								    function strip2 {
 								      IFS=':'
 								      read -ra RP <<< $(patchelf --print-rpath $1)
 								      IFS=' '
 								      RP_NEW=$(join_by : ''${RP[@]:2})
 								      patchelf --set-rpath \$ORIGIN:''${RP_NEW} "$1"
 								    }
 								    for f in $(find ''${out} -name 'libcaffe2*.so')
 								    do
 								      strip2 $f
 								    done
 								  '';
-												pythonPackages.pytorch: fix weirdly broken wheel version number

Otherwise, the wheel gets built with invalid metadata -- causing
'torch >= 1.0.0' to be unsatisfiable in other python packages, for
instance.

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-24 11:46:51 +00:00
+								  # Override the (weirdly) wrong version set by default. See
 								  # https://github.com/NixOS/nixpkgs/pull/52437#issuecomment-449718038
 								  # https://github.com/pytorch/pytorch/blob/v1.0.0/setup.py#L267
 								  PYTORCH_BUILD_VERSION = version;
 								  PYTORCH_BUILD_NUMBER = 0;
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  USE_SYSTEM_NCCL=useSystemNccl;                  # don't build pytorch's third_party NCCL
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												pythonPackages.pytorch: fix Intel MKL BLAS compile failure

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-25 02:00:13 +00:00
+								  # Suppress a weird warning in mkl-dnn, part of ideep in pytorch
 								  # (upstream seems to have fixed this in the wrong place?)
 								  # https://github.com/intel/mkl-dnn/commit/8134d346cdb7fe1695a2aa55771071d455fae0bc
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  # https://github.com/pytorch/pytorch/issues/22346
 								  #
 								  # Also of interest: pytorch ignores CXXFLAGS and uses CFLAGS for both C and C++:
 								  # https://github.com/pytorch/pytorch/blob/v1.2.0/setup.py#L17
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  NIX_CFLAGS_COMPILE = lib.optionals (blas.implementation == "mkl") [ "-Wno-error=array-bounds" ];
-												pythonPackages.pytorch: fix Intel MKL BLAS compile failure

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-25 02:00:13 +00:00
-												pytorch: Use nativeBuildInputs to specify binary build dependencies.

											
										
										
											2019-03-06 21:34:26 +00:00
+								  nativeBuildInputs = [
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    cmake
-												utillinux: rename to util-linux

											
										
										
											2020-11-24 15:29:28 +00:00
+								    util-linux
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    which
 								    ninja
-												pytorch: Move cudatoolkit to nativeBuildInputs

nvcc must be available in PATH at build time; otherwise CUDA support
will be disabled.

Signed-off-by: Anders Kaseorg <andersk@mit.edu>

											
										
										
											2019-04-22 03:31:55 +01:00
+								  ] ++ lib.optionals cudaSupport [ cudatoolkit_joined ];
-												pytorch: Use nativeBuildInputs to specify binary build dependencies.

											
										
										
											2019-03-06 21:34:26 +00:00
-												python3Packages.pytorch: remove oneDNN dependency

oneDNN was added as a dependency, but it is not actually used by
PyTorch. PyTorch uses oneDNN from the vendored iDeep dependency.

Using a system-provided oneDNN is currently not a supported build
option.

											
										
										
											2020-08-26 09:46:22 +01:00
+								  buildInputs = [ blas blas.provider ]
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								    ++ lib.optionals cudaSupport [ cudnn magma nccl ]
-												pythonPackages.pytorch: add libnuma dep on Linux

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-25 01:59:40 +00:00
+								    ++ lib.optionals stdenv.isLinux [ numactl ];
-												pytorch: fix sha256 hash

											
										
										
											2017-11-22 22:02:34 +00:00
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  propagatedBuildInputs = [
 								    cffi
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    click
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								    numpy
 								    pyyaml
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								    typing-extensions
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								    # the following are required for tensorboard support
 								    pillow six future tensorflow-tensorboard protobuf
-												python3Packages.pytorch: 1.6.0 -> 1.7.0

Changelog:

https://github.com/pytorch/pytorch/releases/tag/v1.7.0

											
										
										
											2020-10-28 10:58:55 +00:00
+								  ] ++ lib.optionals openMPISupport [ openmpi ]
 								    ++ lib.optionals (pythonOlder "3.7") [ dataclasses ];
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								  checkInputs = [ hypothesis ninja psutil ];
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: fixup builds with MKL

- Pass `blas.provider` into `buildInputs`, so that CMake can find the actual
  `mkl` for inspection of its cmake files and headers.

- Add `USE_MKL` correctly when the blas provider is `mkl`.

- Use the MKLDNN and MKLDNN_CBLAS flags by default, since `mkldnn` is FOSS and
  always available.

- Remove a patch for MKL 2019, since we've moved to 2020.

- Add a pythonImportsCheck for "torch" as a basic sanity-check

- Removed some unused variables at the top of the file

											
										
										
											2020-05-03 01:40:27 +01:00
+								  # Tests take a long time and may be flaky, so just sanity-check imports
 								  doCheck = false;
 								  pythonImportsCheck = [
 								    "torch"
 								  ];
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
 								  # Command line for the upstream test runner (test/run_test.py), built by
 								  # joining the pieces below with spaces. doCheck is set to false in this
 								  # file, so this only takes effect when checks are re-enabled.
 								  # cudaStubEnv is defined outside this section of the file.
 								  # The inner list holds the test names passed after --exclude.
+								  checkPhase = with lib.versions; with lib.strings; concatStringsSep " " [
 								    cudaStubEnv
 								    "${python.interpreter} test/run_test.py"
 								    "--exclude"
 								    (concatStringsSep " " [
 								      "utils" # utils requires git, which is not allowed in the check phase
 								      # "dataloader" # psutils correctly finds and triggers multiprocessing, but is too sandboxed to run -- resulting in numerous errors
 								      # ^^^^^^^^^^^^ NOTE: while test_dataloader does return errors, these are acceptable errors and do not interfere with the build
 								      # tensorboard has acceptable failures for pytorch 1.3.x due to dependencies on tensorboard-plugins
 								      (optionalString (majorMinor version == "1.3" ) "tensorboard")
 								    ])
 								  ];
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  postInstall = ''
 								    mkdir $dev
 								    cp -r $out/${python.sitePackages}/torch/include $dev/include
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								    cp -r $out/${python.sitePackages}/torch/share   $dev/share
-												python3Packages.pytorch: create separate lib output

At some point pytorch.dev was added to expose the libtorch headers and
libraries to non-Python users of libtorch. However, this output
currently has two disadvantages:

1. An application that compiles against the dev output will also have
   the libtorch header files in its closure. This is not so nice when
   e.g. building Docker images of applications that use libtorch.
2. The dev output has a large transitive closure with many dependencies
   that are not necessary when compiling against libtorch.

This change adds the `lib` output so that applications that only link
against libtorch libraries have a small closure.

Before this change, the libtorch dependency adds 746MiB:

% nix path-info -S `realpath result-dev`
/nix/store/10rmy81bjk628sfpbj2szxlws6brq1xn-python3.8-pytorch-1.5.1-dev   782203848

With this change it is reduced to 196MiB:

% nix path-info -S `realpath result-lib`
/nix/store/bck65lf0z7gdhcf89w1zs5nz333lhgwa-python3.8-pytorch-1.5.1-lib   205865056

											
										
										
											2020-07-07 14:15:46 +01:00
-												python3Packages.pytorch: Fix CMake files for split outputs

Fixes #102146

											
										
										
											2020-12-03 07:30:18 +00:00
+								    # Fix up library paths for split outputs
 								    substituteInPlace \
 								      $dev/share/cmake/Torch/TorchConfig.cmake \
 								      --replace \''${TORCH_INSTALL_PREFIX}/lib "$lib/lib"
 								    substituteInPlace \
 								      $dev/share/cmake/Caffe2/Caffe2Targets-release.cmake \
 								      --replace \''${_IMPORT_PREFIX}/lib "$lib/lib"
-												python3Packages.pytorch: create separate lib output

At some point pytorch.dev was added to expose the libtorch headers and
libraries to non-Python users of libtorch. However, this output
currently has two disadvantages:

1. An application that compiles against the dev output will also have
   the libtorch header files in its closure. This is not so nice when
   e.g. building Docker images of applications that use libtorch.
2. The dev output has a large transitive closure with many dependencies
   that are not necessary when compiling against libtorch.

This change adds the `lib` output so that applications that only link
against libtorch libraries have a small closure.

Before this change, the libtorch dependency adds 746MiB:

% nix path-info -S `realpath result-dev`
/nix/store/10rmy81bjk628sfpbj2szxlws6brq1xn-python3.8-pytorch-1.5.1-dev   782203848

With this change it is reduced to 196MiB:

% nix path-info -S `realpath result-lib`
/nix/store/bck65lf0z7gdhcf89w1zs5nz333lhgwa-python3.8-pytorch-1.5.1-lib   205865056

											
										
										
											2020-07-07 14:15:46 +01:00
+								    mkdir $lib
 								    cp -r $out/${python.sitePackages}/torch/lib     $lib/lib
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								  '';
 								  # Darwin only: the script below uses install_name_tool to set each
 								  # dylib's install name (-id) to its path under $lib/lib, and to replace
 								  # the @rpath/... references between the libraries with those paths.
 								  # Uses `lib` directly, like the rest of this file, instead of the
 								  # deprecated `stdenv.lib` alias.
 								  postFixup = lib.optionalString stdenv.isDarwin ''
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    for f in $(ls $lib/lib/*.dylib); do
 								        install_name_tool -id $lib/lib/$(basename $f) $f || true
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    done
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libshm.dylib $lib/lib/libshm.dylib $lib/lib/libtorch_python.dylib
 								    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libtorch_python.dylib
 								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch_python.dylib
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch.dylib
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_observers.dylib
 								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_observers.dylib
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_module_test_dynamic.dylib
 								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_module_test_dynamic.dylib
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libcaffe2_detectron_ops.dylib
 								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libcaffe2_detectron_ops.dylib
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python3Packages.pytorch: fix library names in lib output on Darwin

The library name fixup was attempted on the dev output, whereas it should be
applied to the lib output.

											
										
										
											2020-08-06 09:02:46 +01:00
+								    install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libshm.dylib
 								    install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libshm.dylib
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  '';
-												pytorch: fix sha256 hash

											
										
										
											2017-11-22 22:02:34 +00:00
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  meta = {
-												pythonPackages.pytorch: meta touch up, add myself as maintainer

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-25 01:58:04 +00:00
+								    description = "Open source, prototype-to-production deep learning platform";
-												treewide: Per RFC45, remove all unquoted URLs

											
										
										
											2020-04-01 02:11:51 +01:00
+								    homepage    = "https://pytorch.org/";
-												pythonPackages.pytorch: meta touch up, add myself as maintainer

Signed-off-by: Austin Seipp <aseipp@pobox.com>

											
										
										
											2018-12-25 01:58:04 +00:00
+								    license     = lib.licenses.bsd3;
-												python3Packages.pytorch: 1.0.0 -> 1.2.0

											
										
										
											2019-10-20 22:07:04 +01:00
+								    platforms   = with lib.platforms; linux ++ lib.optionals (!cudaSupport) darwin;
-												pytorch: 1.2.0 -> 1.4.1

Co-authored-by: Benjamin Hipple <bhipple@protonmail.com>

											
										
										
											2019-12-17 17:55:43 +00:00
+								    maintainers = with lib.maintainers; [ teh thoughtpolice tscholak ]; # tscholak esp. for darwin-related builds
-												python.pkgs.pytorch: init at 0.1.12

											
										
										
											2017-07-16 20:15:05 +01:00
+								  };
 								}