depot/third_party/nixpkgs/pkgs/development/python-modules/openai-triton/default.nix

{
  lib,
  config,
  buildPythonPackage,
  fetchFromGitHub,
  fetchpatch,
  addOpenGLRunpath,
  setuptools,
  pytestCheckHook,
  pythonRelaxDepsHook,
  cmake,
  ninja,
  pybind11,
  gtest,
  zlib,
  ncurses,
  libxml2,
  lit,
  llvm,
  filelock,
  torchWithRocm,
  python,

  runCommand,

  cudaPackages,
  cudaSupport ? config.cudaSupport,
}:

let
  # Path to the `ptxas` executable inside cudaPackages.cuda_nvcc. CUDA-enabled builds
  # symlink it into triton/third_party/cuda/bin (see preConfigure and postFixup).
  # Make sure cudaPackages is the right version each update (See python/setup.py)
  ptxas = "${cudaPackages.cuda_nvcc}/bin/ptxas";
in
buildPythonPackage rec {
  pname = "triton";
  version = "2.1.0";
  # Build through the pyproject code path of buildPythonPackage
  pyproject = true;

  # Upstream sources at the release tag "v" + version, fetched from github.com/openai/triton.
  # `hash` pins the fetched tree and has to be refreshed whenever `version` changes.
  src = fetchFromGitHub {
    owner = "openai";
    repo = pname;
    rev = "v${version}";
    hash = "sha256-8UTUwLH+SriiJnpejdrzz9qIquP2zBp1/uwLdHmv0XQ=";
  };

  patches =
    [
      # Upstream commit 52c146f6, applied on top of the release sources: fix overflow error
      (fetchpatch {
        url = "https://github.com/openai/triton/commit/52c146f66b79b6079bcd28c55312fc6ea1852519.patch";
        hash = "sha256-098/TCQrzvrBAbQiaVGCMaF3o5Yc3yWDxzwSkzIuAtY=";
      })
    ]
    # The local patches below are applied only when building without CUDA support
    ++ lib.optionals (!cudaSupport) [
      # NOTE(review): judging by the file name, this stops the build from downloading ptxas;
      # confirm against the patch contents
      ./0000-dont-download-ptxas.patch
      # openai-triton wants to get ptxas version even if ptxas is not
      # used, resulting in ptxas not found error.
      ./0001-ptxas-disable-version-key-for-non-cuda-targets.patch
    ];

  # Tools executed on the build platform
  nativeBuildInputs = [
    setuptools
    # Processes the `pythonRemoveDeps` list defined further down
    pythonRelaxDepsHook
    # pytestCheckHook stays disabled: it requires torch (circular dependency) and probably needs GPUs
    # pytestCheckHook
    # cmake and ninja are invoked by upstream's setup.py (see dontUseCmakeConfigure)
    cmake
    ninja

    # Note for future:
    # These *probably* should go in depsTargetTarget
    # ...but we cannot test cross right now anyway
    # because we only support cudaPackages on x86_64-linux atm
    lit
    llvm
  ];

  # Libraries for the native (CMake/C++) part of the build.
  # gtest satisfies the `find_package(GTest REQUIRED)` that postPatch writes into
  # unittest/CMakeLists.txt; the remaining entries are presumably needed to compile
  # and link against llvm and the Python bindings (TODO confirm).
  buildInputs = [
    gtest
    libxml2.dev
    ncurses
    pybind11
    zlib
  ];

  # Python dependencies that must also be available to packages depending on triton.
  # torch is intentionally absent here (circular dependency, see pythonRemoveDeps).
  propagatedBuildInputs = [
    filelock
    # openai-triton uses setuptools at runtime:
    # https://github.com/NixOS/nixpkgs/pull/286763/#discussion_r1480392652
    setuptools
  ];

  # Source-level adjustments applied after `patches`:
  #   * make setup.py take its CMake arguments from $cmakeFlags instead of downloading
  #     third-party packages,
  #   * drop the bundled FileCheck and the googletest download,
  #   * (CUDA only) extend the linker flags triton uses when it compiles helper modules.
  postPatch =
    let
      # Bash was getting weird without linting,
      # but basically upstream contains [cc, ..., "-lcuda", ...]
      # and we replace it with [..., "-lcuda", "-L/run/opengl-driver/lib", "-L$stubs", ...]
      old = [ "-lcuda" ];
      new = [
        "-lcuda"
        # driverLink is only the /run/opengl-driver prefix; the driver's libcuda.so lives
        # in its lib/ subdirectory, so the search path has to name that directory.
        "-L${addOpenGLRunpath.driverLink}/lib"
        # Fallback for linking when no driver is installed: the libcuda stub from cudart
        "-L${cudaPackages.cuda_cudart}/lib/stubs/"
      ];

      # Render a list of flags as the Python source fragment `"a", "b", ...`
      quote = x: ''"${x}"'';
      oldStr = lib.concatMapStringsSep ", " quote old;
      newStr = lib.concatMapStringsSep ", " quote new;
    in
    ''
      # Use our `cmakeFlags` instead and avoid downloading dependencies
      substituteInPlace python/setup.py \
        --replace "= get_thirdparty_packages(triton_cache_path)" "= os.environ[\"cmakeFlags\"].split()"

      # Already defined in llvm, when built with -DLLVM_INSTALL_UTILS
      substituteInPlace bin/CMakeLists.txt \
        --replace "add_subdirectory(FileCheck)" ""

      # Don't fetch googletest
      substituteInPlace unittest/CMakeLists.txt \
        --replace "include (\''${CMAKE_CURRENT_SOURCE_DIR}/googletest.cmake)" "" \
        --replace "include(GoogleTest)" "find_package(GTest REQUIRED)"
    ''
    + lib.optionalString cudaSupport ''
      # Use our linker flags
      substituteInPlace python/triton/common/build.py \
        --replace '${oldStr}' '${newStr}'
    '';

  # Shell run before the configure phase: prepares the environment for upstream's
  # setup.py and enters ./python, where the rest of the build takes place.
  preConfigure =
    let
      # Steps performed for every build variant
      commonSetup = ''
        # Ensure that the build process uses the requested number of cores
        export MAX_JOBS="$NIX_BUILD_CORES"

        # Upstream's setup.py tries to write cache somewhere in ~/
        export HOME=$(mktemp -d)

        # Upstream's github actions patch setup.cfg to write base-dir. May be redundant
        echo "
        [build_ext]
        base-dir=$PWD" >> python/setup.cfg

        # The rest (including buildPhase) is relative to ./python/
        cd python
      '';

      # Steps performed only for CUDA-enabled builds.
      # Avoid GLIBCXX mismatch with other cuda-enabled python packages
      # (presumably this is what pinning CC/CXX to the cudaPackages compiler achieves).
      cudaSetup = ''
        export CC=${cudaPackages.backendStdenv.cc}/bin/cc;
        export CXX=${cudaPackages.backendStdenv.cc}/bin/c++;

        # Work around download_and_copy_ptxas()
        mkdir -p $PWD/triton/third_party/cuda/bin
        ln -s ${ptxas} $PWD/triton/third_party/cuda/bin
      '';
    in
    commonSetup + lib.optionalString cudaSupport cudaSetup;

  # cmake is listed in nativeBuildInputs only as a tool: disable the configure step it
  # would otherwise contribute, because CMake is run by setup.py instead
  dontUseCmakeConfigure = true;

  # Setuptools (?) strips runpath and +x flags from the installed ptxas.
  # For CUDA builds, replace whatever was installed with a fresh symlink to the real binary.
  postFixup =
    let
      # Location of the bundled ptxas inside the installed package
      installedPtxas = "$out/${python.sitePackages}/triton/third_party/cuda/bin/ptxas";
    in
    lib.optionalString cudaSupport ''
      rm -f ${installedPtxas}
      ln -s ${ptxas} ${installedPtxas}
    '';

  checkInputs = [ cmake ]; # ctest
  # The setuptools test runner is not used; the C++ unit tests are driven from preCheck
  dontUseSetuptoolsCheck = true;

  # Runs the CMake-registered unit tests, then moves to the Python unit test directory.
  preCheck = ''
    # build/temp* refers to build_ext.build_temp (looked up in the build logs).
    # The location is derived from the builder's own variables rather than a literal
    # /build/source, so it still resolves when the build directory or source root differ.
    (cd "$NIX_BUILD_TOP/$sourceRoot"/python/build/temp* ; ctest)

    # For pytestCheckHook
    cd test/unit
  '';

  # Circular dependency on torch
  # pythonImportsCheck = [
  #   "triton"
  #   "triton.language"
  # ];

  # Ultimately, torch is our test suite:
  passthru.tests = {
    inherit torchWithRocm;

    # Stand-in for pythonImportsCheck, kept as a separate derivation so that it keeps
    # working if the circular dependency on torch forces pythonImportsCheck to stay disabled.
    import-triton =
      let
        # Interpreter environment that contains the packaged triton
        pythonWithTriton = python.withPackages (pythonPackages: [ pythonPackages.openai-triton ]);
      in
      runCommand "import-triton" { nativeBuildInputs = [ pythonWithTriton ]; } ''
        python << \EOF
        import triton
        import triton.language
        EOF
        touch "$out"
      '';
  };

  # Requirements stripped from the package's declared Python dependencies
  # (handled by pythonRelaxDepsHook from nativeBuildInputs)
  pythonRemoveDeps = [
    # Circular dependency, cf. https://github.com/openai/triton/issues/1374
    "torch"

    # CLI tools without dist-info
    "cmake"
    "lit"
  ];

  # Package metadata; every library value is referenced explicitly through `lib`
  meta = {
    description = "Language and compiler for writing highly efficient custom Deep-Learning primitives";
    homepage = "https://github.com/openai/triton";
    license = lib.licenses.mit;
    platforms = lib.platforms.linux;
    maintainers = [
      lib.maintainers.SomeoneSerge
      lib.maintainers.Madouura
    ];
  };
}
Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`{`
			`lib,`
			`config,`
			`buildPythonPackage,`
			`fetchFromGitHub,`
			`fetchpatch,`
			`addOpenGLRunpath,`
			`setuptools,`
			`pytestCheckHook,`
			`pythonRelaxDepsHook,`
			`cmake,`
			`ninja,`
			`pybind11,`
			`gtest,`
			`zlib,`
			`ncurses,`
			`libxml2,`
			`lit,`
			`llvm,`
			`filelock,`
			`torchWithRocm,`
			`python,`

			`runCommand,`

			`cudaPackages,`
			`cudaSupport ? config.cudaSupport,`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`}:`

			`let`
Project import generated by Copybara. GitOrigin-RevId: bd645e8668ec6612439a9ee7e71f7eac4099d4f6 2024-01-02 11:29:13 +00:00			`ptxas = "${cudaPackages.cuda_nvcc}/bin/ptxas"; # Make sure cudaPackages is the right version each update (See python/setup.py)`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`in`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`buildPythonPackage rec {`
			`pname = "triton";`
Project import generated by Copybara. GitOrigin-RevId: bd645e8668ec6612439a9ee7e71f7eac4099d4f6 2024-01-02 11:29:13 +00:00			`version = "2.1.0";`
			`pyproject = true;`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`src = fetchFromGitHub {`
			`owner = "openai";`
			`repo = pname;`
			`rev = "v${version}";`
Project import generated by Copybara. GitOrigin-RevId: bd645e8668ec6612439a9ee7e71f7eac4099d4f6 2024-01-02 11:29:13 +00:00			`hash = "sha256-8UTUwLH+SriiJnpejdrzz9qIquP2zBp1/uwLdHmv0XQ=";`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`};`

Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`patches =`
			`[`
			`# fix overflow error`
			`(fetchpatch {`
			`url = "https://github.com/openai/triton/commit/52c146f66b79b6079bcd28c55312fc6ea1852519.patch";`
			`hash = "sha256-098/TCQrzvrBAbQiaVGCMaF3o5Yc3yWDxzwSkzIuAtY=";`
			`})`
			`]`
			`++ lib.optionals (!cudaSupport) [`
			`./0000-dont-download-ptxas.patch`
			`# openai-triton wants to get ptxas version even if ptxas is not`
			`# used, resulting in ptxas not found error.`
			`./0001-ptxas-disable-version-key-for-non-cuda-targets.patch`
			`];`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`nativeBuildInputs = [`
Project import generated by Copybara. GitOrigin-RevId: bd645e8668ec6612439a9ee7e71f7eac4099d4f6 2024-01-02 11:29:13 +00:00			`setuptools`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`pythonRelaxDepsHook`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`# pytestCheckHook # Requires torch (circular dependency) and probably needs GPUs:`
			`cmake`
			`ninja`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`# Note for future:`
			`# These probably should go in depsTargetTarget`
			`# ...but we cannot test cross right now anyway`
			`# because we only support cudaPackages on x86_64-linux atm`
			`lit`
			`llvm`
			`];`

			`buildInputs = [`
			`gtest`
			`libxml2.dev`
			`ncurses`
			`pybind11`
			`zlib`
			`];`

Project import generated by Copybara. GitOrigin-RevId: 1536926ef5621b09bba54035ae2bb6d806d72ac8 2024-02-29 20:09:43 +00:00			`propagatedBuildInputs = [`
			`filelock`
			`# openai-triton uses setuptools at runtime:`
			`# https://github.com/NixOS/nixpkgs/pull/286763/#discussion_r1480392652`
			`setuptools`
			`];`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00
Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`postPatch =`
			`let`
			`# Bash was getting weird without linting,`
			`# but basically upstream contains [cc, ..., "-lcuda", ...]`
			`# and we replace it with [..., "-lcuda", "-L/run/opengl-driver/lib", "-L$stubs", ...]`
			`old = [ "-lcuda" ];`
			`new = [`
			`"-lcuda"`
			`"-L${addOpenGLRunpath.driverLink}"`
			`"-L${cudaPackages.cuda_cudart}/lib/stubs/"`
			`];`

			`quote = x: ''"${x}"'';`
			`oldStr = lib.concatMapStringsSep ", " quote old;`
			`newStr = lib.concatMapStringsSep ", " quote new;`
			`in`
			`''`
			# Use our `cmakeFlags` instead and avoid downloading dependencies
			`substituteInPlace python/setup.py \`
			`--replace "= get_thirdparty_packages(triton_cache_path)" "= os.environ[\"cmakeFlags\"].split()"`

			`# Already defined in llvm, when built with -DLLVM_INSTALL_UTILS`
			`substituteInPlace bin/CMakeLists.txt \`
			`--replace "add_subdirectory(FileCheck)" ""`

			`# Don't fetch googletest`
			`substituteInPlace unittest/CMakeLists.txt \`
			`--replace "include (\''${CMAKE_CURRENT_SOURCE_DIR}/googletest.cmake)" ""\`
			`--replace "include(GoogleTest)" "find_package(GTest REQUIRED)"`
			`''`
			`+ lib.optionalString cudaSupport ''`
			`# Use our linker flags`
			`substituteInPlace python/triton/common/build.py \`
			`--replace '${oldStr}' '${newStr}'`
			`'';`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`# Avoid GLIBCXX mismatch with other cuda-enabled python packages`
Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`preConfigure =`
			`''`
			`# Ensure that the build process uses the requested number of cores`
			`export MAX_JOBS="$NIX_BUILD_CORES"`

			`# Upstream's setup.py tries to write cache somewhere in ~/`
			`export HOME=$(mktemp -d)`

			`# Upstream's github actions patch setup.cfg to write base-dir. May be redundant`
			`echo "`
			`[build_ext]`
			`base-dir=$PWD" >> python/setup.cfg`

			`# The rest (including buildPhase) is relative to ./python/`
			`cd python`
			`''`
			`+ lib.optionalString cudaSupport ''`
			`export CC=${cudaPackages.backendStdenv.cc}/bin/cc;`
			`export CXX=${cudaPackages.backendStdenv.cc}/bin/c++;`

			`# Work around download_and_copy_ptxas()`
			`mkdir -p $PWD/triton/third_party/cuda/bin`
			`ln -s ${ptxas} $PWD/triton/third_party/cuda/bin`
			`'';`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`# CMake is run by setup.py instead`
			`dontUseCmakeConfigure = true;`

Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`# Setuptools (?) strips runpath and +x flags. Let's just restore the symlink`
Project import generated by Copybara. GitOrigin-RevId: c757e9bd77b16ca2e03c89bf8bc9ecb28e0c06ad 2023-11-16 04:20:00 +00:00			`postFixup = lib.optionalString cudaSupport ''`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`rm -f $out/${python.sitePackages}/triton/third_party/cuda/bin/ptxas`
			`ln -s ${ptxas} $out/${python.sitePackages}/triton/third_party/cuda/bin/ptxas`
			`'';`

			`checkInputs = [ cmake ]; # ctest`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`dontUseSetuptoolsCheck = true;`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00
			`preCheck = ''`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`# build/temp* refers to build_ext.build_temp (looked up in the build logs)`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`(cd /build/source/python/build/temp* ; ctest)`

			`# For pytestCheckHook`
			`cd test/unit`
			`'';`

			`# Circular dependency on torch`
			`# pythonImportsCheck = [`
			`# "triton"`
			`# "triton.language"`
			`# ];`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`# Ultimately, torch is our test suite:`
Project import generated by Copybara. GitOrigin-RevId: 1536926ef5621b09bba54035ae2bb6d806d72ac8 2024-02-29 20:09:43 +00:00			`passthru.tests = {`
			`inherit torchWithRocm;`
			`# Implemented as alternative to pythonImportsCheck, in case if circular dependency on torch occurs again,`
			`# and pythonImportsCheck is commented back.`
Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`import-triton =`
			`runCommand "import-triton"`
			`{ nativeBuildInputs = [ (python.withPackages (ps: [ ps.openai-triton ])) ]; }`
			`''`
			`python << \EOF`
			`import triton`
			`import triton.language`
			`EOF`
			`touch "$out"`
			`'';`
Project import generated by Copybara. GitOrigin-RevId: 1536926ef5621b09bba54035ae2bb6d806d72ac8 2024-02-29 20:09:43 +00:00			`};`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00
			`pythonRemoveDeps = [`
			`# Circular dependency, cf. https://github.com/openai/triton/issues/1374`
			`"torch"`

			`# CLI tools without dist-info`
			`"cmake"`
			`"lit"`
			`];`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`meta = with lib; {`
Project import generated by Copybara. GitOrigin-RevId: 7c9cc5a6e5d38010801741ac830a3f8fd667a7a0 2023-10-19 13:55:26 +00:00			`description = "Language and compiler for writing highly efficient custom Deep-Learning primitives";`
			`homepage = "https://github.com/openai/triton";`
Project import generated by Copybara. GitOrigin-RevId: 33d1e753c82ffc557b4a585c77de43d4c922ebb5 2024-05-15 15:35:15 +00:00			`platforms = platforms.linux;`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`license = licenses.mit;`
Project import generated by Copybara. GitOrigin-RevId: e8057b67ebf307f01bdcc8fba94d94f75039d1f6 2024-06-05 15:53:02 +00:00			`maintainers = with maintainers; [`
			`SomeoneSerge`
			`Madouura`
			`];`
Project import generated by Copybara. GitOrigin-RevId: fe2ecaf706a5907b5e54d979fbde4924d84b65fc 2023-04-12 12:48:02 +00:00			`};`
			`}`