pkgs/development/python-modules/tensorflow/default.nix at 23.05-pre · pyrox.dev/nixpkgs

pyrox.dev / nixpkgs
lol
nixpkgs / pkgs / development / python-modules / tensorflow / default.nix
at 23.05-pre 16 kB view raw
  1{ stdenv, bazel_5, buildBazelPackage, isPy3k, lib, fetchFromGitHub, symlinkJoin
  2, addOpenGLRunpath, fetchpatch, patchelfUnstable
  3# Python deps
  4, buildPythonPackage, pythonOlder, python
  5# Python libraries
  6, numpy, tensorboard, absl-py
  7, packaging, setuptools, wheel, keras, keras-preprocessing, google-pasta
  8, opt-einsum, astunparse, h5py
  9, termcolor, grpcio, six, wrapt, protobuf-python, tensorflow-estimator
 10, dill, flatbuffers-python, portpicker, tblib, typing-extensions
 11# Common deps
 12, git, pybind11, which, binutils, glibcLocales, cython, perl
 13# Common libraries
 14, jemalloc, mpi, gast, grpc, sqlite, boringssl, jsoncpp, nsync
 15, curl, snappy, flatbuffers-core, lmdb-core, icu, double-conversion, libpng, libjpeg_turbo, giflib, protobuf-core
 16# Upstream by default includes cuda support since tensorflow 1.15. We could do
 17# that in nix as well. It would make some things easier and less confusing, but
 18# it would also make the default tensorflow package unfree. See
 19# https://groups.google.com/a/tensorflow.org/forum/#!topic/developers/iRCt5m4qUz0
 20, cudaSupport ? false, cudaPackages ? {}
 21, mklSupport ? false, mkl ? null
 22, tensorboardSupport ? true
 23# XLA without CUDA is broken
 24, xlaSupport ? cudaSupport
 25# Default from ./configure script
 26, cudaCapabilities ? [ "sm_35" "sm_50" "sm_60" "sm_70" "sm_75" "compute_80" ]
 27, sse42Support ? stdenv.hostPlatform.sse4_2Support
 28, avx2Support  ? stdenv.hostPlatform.avx2Support
 29, fmaSupport   ? stdenv.hostPlatform.fmaSupport
 30# Darwin deps
 31, Foundation, Security, cctools, llvmPackages_11
 32}:
 33
 34let
 35  inherit (cudaPackages) cudatoolkit cudnn nccl;
 36in
 37
 38assert cudaSupport -> cudatoolkit != null
 39                   && cudnn != null;
 40
 41# unsupported combination
 42assert ! (stdenv.isDarwin && cudaSupport);
 43
 44assert mklSupport -> mkl != null;
 45
 46let
 47  withTensorboard = (pythonOlder "3.6") || tensorboardSupport;
 48
 49  cudatoolkit_joined = symlinkJoin {
 50    name = "${cudatoolkit.name}-merged";
 51    paths = [
 52      cudatoolkit.lib
 53      cudatoolkit.out
 54    ] ++ lib.optionals (lib.versionOlder cudatoolkit.version "11") [
 55      # for some reason some of the required libs are in the targets/x86_64-linux
 56      # directory; not sure why but this works around it
 57      "${cudatoolkit}/targets/${stdenv.system}"
 58    ];
 59  };
 60
 61  cudatoolkit_cc_joined = symlinkJoin {
 62    name = "${cudatoolkit.cc.name}-merged";
 63    paths = [
 64      cudatoolkit.cc
 65      binutils.bintools # for ar, dwp, nm, objcopy, objdump, strip
 66    ];
 67  };
 68
 69  # Needed for _some_ system libraries, grep INCLUDEDIR.
 70  includes_joined = symlinkJoin {
 71    name = "tensorflow-deps-merged";
 72    paths = [
 73      jsoncpp
 74    ];
 75  };
 76
 77  tfFeature = x: if x then "1" else "0";
 78
 79  version = "2.10.0";
 80  variant = if cudaSupport then "-gpu" else "";
 81  pname = "tensorflow${variant}";
 82
 83  pythonEnv = python.withPackages (_:
 84    [ # python deps needed during wheel build time (not runtime, see the buildPythonPackage part for that)
 85      # This list can likely be shortened, but each trial takes multiple hours so won't bother for now.
 86      absl-py
 87      astunparse
 88      dill
 89      flatbuffers-python
 90      gast
 91      google-pasta
 92      grpcio
 93      h5py
 94      keras-preprocessing
 95      numpy
 96      opt-einsum
 97      packaging
 98      protobuf-python
 99      setuptools
100      six
101      tblib
102      tensorboard
103      tensorflow-estimator
104      termcolor
105      typing-extensions
106      wheel
107      wrapt
108  ]);
109
110  rules_cc_darwin_patched = stdenv.mkDerivation {
111    name = "rules_cc-${pname}-${version}";
112
113    src = _bazel-build.deps;
114
115    prePatch = "pushd rules_cc";
116    patches = [
117      # https://github.com/bazelbuild/rules_cc/issues/122
118      (fetchpatch {
119        name = "tensorflow-rules_cc-libtool-path.patch";
120        url = "https://github.com/bazelbuild/rules_cc/commit/8c427ab30bf213630dc3bce9d2e9a0e29d1787db.diff";
121        sha256 = "sha256-C4v6HY5+jm0ACUZ58gBPVejCYCZfuzYKlHZ0m2qDHCk=";
122      })
123
124      # https://github.com/bazelbuild/rules_cc/pull/124
125      (fetchpatch {
126        name = "tensorflow-rules_cc-install_name_tool-path.patch";
127        url = "https://github.com/bazelbuild/rules_cc/commit/156497dc89100db8a3f57b23c63724759d431d05.diff";
128        sha256 = "sha256-NES1KeQmMiUJQVoV6dS4YGRxxkZEjOpFSCyOq9HZYO0=";
129      })
130    ];
131    postPatch = "popd";
132
133    dontConfigure = true;
134    dontBuild = true;
135
136    installPhase = ''
137      runHook preInstall
138
139      mv rules_cc/ "$out"
140
141      runHook postInstall
142    '';
143  };
144  llvm-raw_darwin_patched = stdenv.mkDerivation {
145    name = "llvm-raw-${pname}-${version}";
146
147    src = _bazel-build.deps;
148
149    prePatch = "pushd llvm-raw";
150    patches = [
151      # Fix a vendored config.h that requires the 10.13 SDK
152      ./llvm_bazel_fix_macos_10_12_sdk.patch
153    ];
154    postPatch = ''
155      touch {BUILD,WORKSPACE}
156      popd
157    '';
158
159    dontConfigure = true;
160    dontBuild = true;
161
162    installPhase = ''
163      runHook preInstall
164
165      mv llvm-raw/ "$out"
166
167      runHook postInstall
168    '';
169  };
170  bazel-build = if stdenv.isDarwin then _bazel-build.overrideAttrs (prev: {
171    bazelBuildFlags = prev.bazelBuildFlags ++ [
172      "--override_repository=rules_cc=${rules_cc_darwin_patched}"
173      "--override_repository=llvm-raw=${llvm-raw_darwin_patched}"
174    ];
175    preBuild = ''
176      export AR="${cctools}/bin/libtool"
177    '';
178  }) else _bazel-build;
179
180  _bazel-build = (buildBazelPackage.override (lib.optionalAttrs stdenv.isDarwin {
181    # clang 7 fails to emit a symbol for
182    # __ZN4llvm11SmallPtrSetIPKNS_10AllocaInstELj8EED1Ev in any of the
183    # translation units, so the build fails at link time
184    stdenv = llvmPackages_11.stdenv;
185  })) {
186    name = "${pname}-${version}";
187    bazel = bazel_5;
188
189    src = fetchFromGitHub {
190      owner = "tensorflow";
191      repo = "tensorflow";
192      rev = "v${version}";
193      hash = "sha256-Y6cujiMoQXKQlsLBr7d0T278ltdd00IfsTRycJbRVN4=";
194    };
195
196    # On update, it can be useful to steal the changes from gentoo
197    # https://gitweb.gentoo.org/repo/gentoo.git/tree/sci-libs/tensorflow
198
199    nativeBuildInputs = [
200      which pythonEnv cython perl protobuf-core
201    ] ++ lib.optional cudaSupport addOpenGLRunpath;
202
203    buildInputs = [
204      jemalloc
205      mpi
206      glibcLocales
207      git
208
209      # libs taken from system through the TF_SYS_LIBS mechanism
210      boringssl
211      curl
212      double-conversion
213      flatbuffers-core
214      giflib
215      grpc
216      icu
217      jsoncpp
218      libjpeg_turbo
219      libpng
220      lmdb-core
221      pybind11
222      snappy
223      sqlite
224    ] ++ lib.optionals cudaSupport [
225      cudatoolkit
226      cudnn
227    ] ++ lib.optionals mklSupport [
228      mkl
229    ] ++ lib.optionals stdenv.isDarwin [
230      Foundation
231      Security
232    ] ++ lib.optionals (!stdenv.isDarwin) [
233      nsync
234    ];
235
236    # arbitrarily set to the current latest bazel version, overly careful
237    TF_IGNORE_MAX_BAZEL_VERSION = true;
238
239    # Take as many libraries from the system as possible. Keep in sync with
240    # list of valid syslibs in
241    # https://github.com/tensorflow/tensorflow/blob/master/third_party/systemlibs/syslibs_configure.bzl
242    TF_SYSTEM_LIBS = lib.concatStringsSep "," ([
243      "absl_py"
244      "astor_archive"
245      "astunparse_archive"
246      "boringssl"
247      # Not packaged in nixpkgs
248      # "com_github_googleapis_googleapis"
249      # "com_github_googlecloudplatform_google_cloud_cpp"
250      "com_github_grpc_grpc"
251      "com_google_protobuf"
252      # Fails with the error: external/org_tensorflow/tensorflow/core/profiler/utils/tf_op_utils.cc:46:49: error: no matching function for call to 're2::RE2::FullMatch(absl::lts_2020_02_25::string_view&, re2::RE2&)'
253      # "com_googlesource_code_re2"
254      "curl"
255      "cython"
256      "dill_archive"
257      "double_conversion"
258      "flatbuffers"
259      "functools32_archive"
260      "gast_archive"
261      "gif"
262      "hwloc"
263      "icu"
264      "jsoncpp_git"
265      "libjpeg_turbo"
266      "lmdb"
267      "nasm"
268      "opt_einsum_archive"
269      "org_sqlite"
270      "pasta"
271      "png"
272      "pybind11"
273      "six_archive"
274      "snappy"
275      "tblib_archive"
276      "termcolor_archive"
277      "typing_extensions_archive"
278      "wrapt"
279      "zlib"
280    ] ++ lib.optionals (!stdenv.isDarwin) [
281      "nsync" # fails to build on darwin
282    ]);
283
284    INCLUDEDIR = "${includes_joined}/include";
285
286    # This is needed for the Nix-provided protobuf dependency to work,
287    # as otherwise the rule `link_proto_files` tries to create the links
288    # to `/usr/include/...` which results in build failures.
289    PROTOBUF_INCLUDE_PATH = "${protobuf-core}/include";
290
291    PYTHON_BIN_PATH = pythonEnv.interpreter;
292
293    TF_NEED_GCP = true;
294    TF_NEED_HDFS = true;
295    TF_ENABLE_XLA = tfFeature xlaSupport;
296
297    CC_OPT_FLAGS = " ";
298
299    # https://github.com/tensorflow/tensorflow/issues/14454
300    TF_NEED_MPI = tfFeature cudaSupport;
301
302    TF_NEED_CUDA = tfFeature cudaSupport;
303    TF_CUDA_PATHS = lib.optionalString cudaSupport "${cudatoolkit_joined},${cudnn},${nccl}";
304    GCC_HOST_COMPILER_PREFIX = lib.optionalString cudaSupport "${cudatoolkit_cc_joined}/bin";
305    GCC_HOST_COMPILER_PATH = lib.optionalString cudaSupport "${cudatoolkit_cc_joined}/bin/gcc";
306    TF_CUDA_COMPUTE_CAPABILITIES = lib.concatStringsSep "," cudaCapabilities;
307
308    postPatch = ''
309      # bazel 3.3 should work just as well as bazel 3.1
310      rm -f .bazelversion
311    '' + lib.optionalString (!withTensorboard) ''
312      # Tensorboard pulls in a bunch of dependencies, some of which may
313      # include security vulnerabilities. So we make it optional.
314      # https://github.com/tensorflow/tensorflow/issues/20280#issuecomment-400230560
315      sed -i '/tensorboard ~=/d' tensorflow/tools/pip_package/setup.py
316    '';
317
318    # https://github.com/tensorflow/tensorflow/pull/39470
319    NIX_CFLAGS_COMPILE = [ "-Wno-stringop-truncation" ];
320
321    preConfigure = let
322      opt_flags = []
323        ++ lib.optionals sse42Support ["-msse4.2"]
324        ++ lib.optionals avx2Support ["-mavx2"]
325        ++ lib.optionals fmaSupport ["-mfma"];
326    in ''
327      patchShebangs configure
328
329      # dummy ldconfig
330      mkdir dummy-ldconfig
331      echo "#!${stdenv.shell}" > dummy-ldconfig/ldconfig
332      chmod +x dummy-ldconfig/ldconfig
333      export PATH="$PWD/dummy-ldconfig:$PATH"
334
335      export PYTHON_LIB_PATH="$NIX_BUILD_TOP/site-packages"
336      export CC_OPT_FLAGS="${lib.concatStringsSep " " opt_flags}"
337      mkdir -p "$PYTHON_LIB_PATH"
338
339      # To avoid mixing Python 2 and Python 3
340      unset PYTHONPATH
341    '';
342
343    configurePhase = ''
344      runHook preConfigure
345      ./configure
346      runHook postConfigure
347    '';
348
349    hardeningDisable = [ "format" ];
350
351    bazelBuildFlags = [
352      "--config=opt" # optimize using the flags set in the configure phase
353    ]
354    ++ lib.optionals stdenv.cc.isClang [
355      "--cxxopt=-x" "--cxxopt=c++"
356      "--host_cxxopt=-x" "--host_cxxopt=c++"
357
358      # workaround for https://github.com/bazelbuild/bazel/issues/15359
359      "--spawn_strategy=sandboxed"
360    ]
361    ++ lib.optionals (mklSupport) [ "--config=mkl" ];
362
363    bazelTarget = "//tensorflow/tools/pip_package:build_pip_package //tensorflow/tools/lib_package:libtensorflow";
364
365    removeRulesCC = false;
366    # Without this Bazel complaints about sandbox violations.
367    dontAddBazelOpts = true;
368
369    fetchAttrs = {
370      # cudaSupport causes fetch of ncclArchive, resulting in different hashes
371      sha256 = if cudaSupport then
372        "sha256-KtVReqHL3zxE8TPrqIerSOt59Mgke/ftoFZKMzgX/u8="
373      else
374        if stdenv.isDarwin then
375          # FIXME: this checksum is currently wrong, since the tensorflow dependency fetch is broken on darwin
376          "sha256-j2k9Q+k41nq5nP1VjjkkNjXRov1uAda4RCMDMAthjr0="
377        else
378          "sha256-zH3xNFEU2JR0Ww8bpD4mCiorGtao0WVPP4vklVMgS4A=";
379    };
380
381    buildAttrs = {
382      outputs = [ "out" "python" ];
383
384      preBuild = ''
385        patchShebangs .
386      '';
387
388      installPhase = ''
389        mkdir -p "$out"
390        tar -xf bazel-bin/tensorflow/tools/lib_package/libtensorflow.tar.gz -C "$out"
391        # Write pkgconfig file.
392        mkdir "$out/lib/pkgconfig"
393        cat > "$out/lib/pkgconfig/tensorflow.pc" << EOF
394        Name: TensorFlow
395        Version: ${version}
396        Description: Library for computation using data flow graphs for scalable machine learning
397        Requires:
398        Libs: -L$out/lib -ltensorflow
399        Cflags: -I$out/include/tensorflow
400        EOF
401
402        # build the source code, then copy it to $python (build_pip_package
403        # actually builds a symlink farm so we must dereference them).
404        bazel-bin/tensorflow/tools/pip_package/build_pip_package --src "$PWD/dist"
405        cp -Lr "$PWD/dist" "$python"
406      '';
407
408      postFixup = lib.optionalString cudaSupport ''
409        find $out -type f \( -name '*.so' -or -name '*.so.*' \) | while read lib; do
410          addOpenGLRunpath "$lib"
411        done
412      '';
413
414      requiredSystemFeatures = [
415        "big-parallel"
416      ];
417    };
418
419    meta = with lib; {
420      description = "Computation using data flow graphs for scalable machine learning";
421      homepage = "http://tensorflow.org";
422      license = licenses.asl20;
423      maintainers = with maintainers; [ jyp abbradar ];
424      platforms = with platforms; linux ++ darwin;
425      broken = !(xlaSupport -> cudaSupport);
426    } // lib.optionalAttrs stdenv.isDarwin {
427      timeout = 86400; # 24 hours
428      maxSilent = 14400; # 4h, double the default of 7200s
429    };
430  };
431
# The Python package itself: it installs the source tree produced by the
# Bazel build's `python` output and exposes the C library via passthru.
in buildPythonPackage {
  inherit version pname;
  disabled = !isPy3k;

  src = bazel-build.python;

  # Adjust dependency requirements:
  # - Relax flatbuffers, gast and protobuf version requirements
  # - The purpose of python3Packages.libclang is not clear at the moment and we don't have it packaged yet
  # - keras and tensorflow-io-gcs-filesystem will be considered as optional for now.
  #
  # The last -e expression must not end in a line continuation: a dangling
  # backslash would make anything later appended to postPatch (e.g. through
  # overrideAttrs) part of this sed invocation.
  postPatch = ''
    sed -i setup.py \
      -e "s/'flatbuffers[^']*',/'flatbuffers',/" \
      -e "s/'gast[^']*',/'gast',/" \
      -e "/'libclang[^']*',/d" \
      -e "/'keras[^']*')\?,/d" \
      -e "/'tensorflow-io-gcs-filesystem[^']*',/d" \
      -e "s/'protobuf[^']*',/'protobuf',/"
  '';

  # Upstream has a pip hack that results in bin/tensorboard being in both tensorflow
  # and the propagated input tensorboard, which causes environment collisions.
  # Another possibility would be to have tensorboard only in the buildInputs
  # https://github.com/tensorflow/tensorflow/blob/v1.7.1/tensorflow/tools/pip_package/setup.py#L79
  postInstall = ''
    rm "$out/bin/tensorboard"
  '';

  setupPyGlobalFlags = [ "--project_name ${pname}" ];

  # tensorflow/tools/pip_package/setup.py
  propagatedBuildInputs = [
    absl-py
    astunparse
    flatbuffers-python
    gast
    google-pasta
    grpcio
    h5py
    keras-preprocessing
    numpy
    opt-einsum
    packaging
    protobuf-python
    six
    tensorflow-estimator
    termcolor
    typing-extensions
    wrapt
  ] ++ lib.optionals withTensorboard [
    tensorboard
  ];

  # remove patchelfUnstable once patchelf 0.14 with https://github.com/NixOS/patchelf/pull/256 becomes the default
  nativeBuildInputs = lib.optionals cudaSupport [ addOpenGLRunpath patchelfUnstable ];

  # For CUDA builds, run addOpenGLRunpath on every shared object and prepend
  # the CUDA toolkit, cuDNN and NCCL library directories to its existing
  # rpath. `IFS= read -r` keeps file names intact.
  postFixup = lib.optionalString cudaSupport ''
    find "$out" -type f \( -name '*.so' -or -name '*.so.*' \) | while IFS= read -r lib; do
      addOpenGLRunpath "$lib"

      patchelf --set-rpath "${cudatoolkit}/lib:${cudatoolkit.lib}/lib:${cudnn}/lib:${nccl}/lib:$(patchelf --print-rpath "$lib")" "$lib"
    done
  '';

  # Actual tests are slow and impure.
  # TODO try to run them anyway
  # TODO better test (files in tensorflow/tools/ci_build/builds/*test)
  # TEST_PACKAGES in tensorflow/tools/pip_package/setup.py
  checkInputs = [
    dill
    keras
    portpicker
    tblib
  ];
  # Smoke test: import tensorflow, print a constant and fit a one-unit
  # Keras model for a single epoch.
  checkPhase = ''
    ${python.interpreter} <<EOF
    # A simple "Hello world"
    import tensorflow as tf
    hello = tf.constant("Hello, world!")
    tf.print(hello)

    # Fit a simple model to random data
    import numpy as np
    np.random.seed(0)
    tf.random.set_seed(0)
    model = tf.keras.models.Sequential([
        tf.keras.layers.Dense(1, activation="linear")
    ])
    model.compile(optimizer="sgd", loss="mse")

    x = np.random.uniform(size=(1,1))
    y = np.random.uniform(size=(1,))
    model.fit(x, y, epochs=1)
    EOF
  '';
  # Regression test for #77626 removed because there is no more `tensorflow.contrib`.

  passthru = {
    inherit cudaPackages;
    # The pre-fetched Bazel dependencies and the C library output of the
    # Bazel build.
    deps = bazel-build.deps;
    libtensorflow = bazel-build.out;
  };

  inherit (bazel-build) meta;
}