diff --git a/Cargo.lock b/Cargo.lock index 76196e53e4..9e9de8d366 100644 --- a/Cargo.lock +++ b/Cargo.lock @@ -5117,9 +5117,9 @@ dependencies = [ [[package]] name = "nixl-sys" -version = "0.6.0" +version = "0.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "06b070d86389c00f5144bc0f7a456913212c25fa4e4713c482f2f0bfa0839ee2" +checksum = "a73b92494c94b2ff2d004cd9274d966863089e867dc9cd98bc640aefe7622036" dependencies = [ "bindgen 0.71.1", "cc", diff --git a/container/Dockerfile b/container/Dockerfile index 0d509fe572..4aeaa61c76 100644 --- a/container/Dockerfile +++ b/container/Dockerfile @@ -38,7 +38,7 @@ ARG SCCACHE_REGION="" # NIXL configuration ARG NIXL_UCX_REF=v1.19.0 -ARG NIXL_REF=0.6.0 +ARG NIXL_REF=0.7.0 # Python configuration ARG PYTHON_VERSION=3.12 diff --git a/container/build.sh b/container/build.sh index 373f4abf33..452283aef2 100755 --- a/container/build.sh +++ b/container/build.sh @@ -115,7 +115,7 @@ NONE_BASE_IMAGE_TAG="25.01-cuda12.8-devel-ubuntu24.04" SGLANG_BASE_IMAGE="nvcr.io/nvidia/cuda-dl-base" SGLANG_BASE_IMAGE_TAG="25.01-cuda12.8-devel-ubuntu24.04" -NIXL_REF=0.6.0 +NIXL_REF=0.7.0 NIXL_UCX_REF=v1.19.0 NIXL_UCX_EFA_REF=9d2b88a1f67faf9876f267658bd077b379b8bb76 diff --git a/docs/reference/support-matrix.md b/docs/reference/support-matrix.md index 4b6104b524..2b7b2945be 100644 --- a/docs/reference/support-matrix.md +++ b/docs/reference/support-matrix.md @@ -58,14 +58,14 @@ If you are using a **GPU**, the following GPU models and architectures are suppo | :----------------- | :---------- | :------------------------------------ | :----------- | | ai-dynamo | 0.6.1 | >=2.28 | | | ai-dynamo-runtime | 0.6.1 | >=2.28 (Python 3.12 has known issues) | | -| NIXL | 0.6.0 | >=2.27 | >=11.8 | +| NIXL | 0.7.0 | >=2.27 | >=11.8 | ### Build Dependency | **Build Dependency** | **Version** | | :------------------- | :------------------------------------------------------------------------------- | | **TensorRT-LLM** | 1.1.0rc5 | -| **NIXL** | 0.6.0 | +| **NIXL** | 0.7.0 | | **vLLM** | 0.10.1.1 | | **SGLang** | 0.5.3rc0 | diff --git a/lib/bindings/python/Cargo.lock b/lib/bindings/python/Cargo.lock index c3f4f33b2a..b671326c54 100644 --- a/lib/bindings/python/Cargo.lock +++ b/lib/bindings/python/Cargo.lock @@ -3667,9 +3667,9 @@ dependencies = [ [[package]] name = "nixl-sys" -version = "0.6.0" +version = "0.7.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "06b070d86389c00f5144bc0f7a456913212c25fa4e4713c482f2f0bfa0839ee2" +checksum = "a73b92494c94b2ff2d004cd9274d966863089e867dc9cd98bc640aefe7622036" dependencies = [ "bindgen 0.71.1", "cc", diff --git a/lib/llm/Cargo.toml b/lib/llm/Cargo.toml index cebf062be6..d045152ac9 100644 --- a/lib/llm/Cargo.toml +++ b/lib/llm/Cargo.toml @@ -95,7 +95,7 @@ dialoguer = { version = "0.11", default-features = false, features = [ # block_manager aligned-vec = { version = "0.6.4", optional = true } -nixl-sys = { version = "=0.6.0", optional = true } +nixl-sys = { version = "=0.7.0", optional = true } cudarc = { workspace = true, optional = true } ndarray = { version = "0.16", optional = true } nix = { version = "0.26", optional = true } diff --git a/pyproject.toml b/pyproject.toml index e67f68973f..2455de4b66 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -54,13 +54,13 @@ trtllm =[ vllm = [ "uvloop", - "nixl<=0.6.0", + "nixl<=0.7.0", "vllm[flashinfer]==0.10.2", ] sglang = [ "uvloop", - "nixl<=0.6.0", + "nixl<=0.7.0", "sglang[all]==0.5.4.post1", ]