Skip to content

Commit

Permalink
tensorrt-llm: 0.8.0 -> 0.9.0.dev2024040900
Browse files (browse the repository at this point in the history)
tensorrtllm-backend: 0.8.0 -> 0.9.0
  • Loading branch information
yorickvP committed Apr 15, 2024
1 parent 61425ce commit 5f80297
Show file tree
Hide file tree
Showing 4 changed files with 236 additions and 135 deletions.
30 changes: 11 additions & 19 deletions default.nix
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@
let
deps = config.deps;
python3 = config.python-env.deps.python;
cudaPackages = pkgs.cudaPackages_12_2;
cudaPackages = pkgs.cudaPackages_12_1;
site = python3.sitePackages;
pythonDrvs = config.python-env.pip.drvs;
inherit (pkgs) lib;
Expand All @@ -19,16 +19,16 @@ in
python_packages = [
"--extra-index-url"
"https://pypi.nvidia.com"
"tensorrt_llm==0.8.0"
"torch==2.1.2"
"tensorrt==9.2.0.post12.dev5"
"tensorrt-bindings==9.2.0.post12.dev5"
"tensorrt-libs==9.2.0.post12.dev5"
"tensorrt_llm==0.9.0.dev2024040900"
"torch==2.2.2"
"tensorrt==9.3.0.post12.dev1"
"tensorrt-bindings==9.3.0.post12.dev1"
"tensorrt-libs==9.3.0.post12.dev1"
"nvidia-pytriton==0.5.2" # corresponds to 2.42.0
"httpx"
"nvidia-cublas-cu12<12.4"
"nvidia-cuda-nvrtc-cu12<12.4"
"nvidia-cuda-runtime-cu12<12.4"
"nvidia-cublas-cu12<12.2"
"nvidia-cuda-nvrtc-cu12<12.2"
"nvidia-cuda-runtime-cu12<12.2"
"omegaconf"
"hf-transfer"
];
Expand All @@ -49,14 +49,6 @@ in
tensorrt-bindings.public
];
tensorrt-bindings.mkDerivation.propagatedBuildInputs = [ pythonDrvs.tensorrt-libs.public ];
# fixed in torch 2.2
torch.mkDerivation.postFixup = ''
pushd $out/${site}/torch/lib
ln -s libcudart-*.so.12 libcudart.so.12
ln -s libnvrtc-*.so.12 libnvrtc.so.12
ln -s libnvToolsExt-*.so.1 libnvToolsExt.so.1
popd
'';
tensorrt-libs.mkDerivation.postFixup = ''
pushd $out/${site}/tensorrt_libs
ln -s libnvinfer.so.9 libnvinfer.so
Expand Down Expand Up @@ -122,8 +114,8 @@ in
deps.tensorrt-src = pkgs.fetchFromGitHub {
owner = "NVIDIA";
repo = "TensorRT";
rev = "93b6044fc106b69bce6751f27aa9fc198b02bddc"; # release/9.2 branch
hash = "sha256-W3ytzwq0mm40w6HZ/hArT6G7ID3HSUwzoZ8ix0Q/F6E=";
rev = "6d1397ed4bb65933d02725623c122a157544a729"; # release/9.3 branch
hash = "sha256-XWFyMD7jjvgIihlqCJNyH5iSa1vZCDhv1maLJqMM3UE=";
};
# todo: replace with lockfile
deps.pybind11-stubgen = python3.pkgs.buildPythonPackage rec {
Expand Down
Loading

0 comments on commit 5f80297

Please sign in to comment.