pkgs/python-modules/moe-kernels/default.nix (66 lines of code) (raw):

{ lib, stdenv, fetchFromGitHub, buildPythonPackage, autoAddDriverRunpath, cmake, ninja, packaging, setuptools, wheel, which, cudaPackages, nvidia-ml-py, torch, }: buildPythonPackage rec { pname = "moe-kernels"; version = "0.8.2"; src = fetchFromGitHub { owner = "danieldk"; repo = pname; rev = "v${version}"; hash = "sha256-heZpJboVPGUbQgpK49YDayPm4rD/GWwbeuZNv/Byzyw="; }; stdenv = cudaPackages.backendStdenv; nativeBuildInputs = with cudaPackages; [ autoAddDriverRunpath cmake cuda_nvcc ninja which ]; build-system = [ packaging setuptools wheel ]; buildInputs = with cudaPackages; [ cuda_cccl cuda_cudart cuda_nvtx libcublas libcusolver libcusparse ]; env = { CUDA_HOME = "${lib.getDev cudaPackages.cuda_nvcc}"; TORCH_CUDA_ARCH_LIST = lib.concatStringsSep ";" torch.cudaCapabilities; }; dependencies = [ nvidia-ml-py torch ]; # cmake/ninja are used for parallel builds, but we don't want the # cmake configure hook to kick in. dontUseCmakeConfigure = true; # We don't have any tests in this package (yet). doCheck = false; pythonImportsCheck = [ "moe_kernels" ]; meta = with lib; { description = "Mixture of Experts kernels"; license = licenses.asl20; platforms = platforms.linux; }; }