NVIDIA-NeMo · terrykong · Feb 3, 2026 · Feb 4, 2026
@@ -19,10 +19,10 @@ dependencies = [
   "setuptools",
   "pip",                                                                                                              # Required for frozen environments; uv venv --seed may not reliably install pip
   "ninja",                                                                                                            # for flash-attn parallel build
-  "torch==2.9.0",
+  "torch==2.9.1",
   "triton; sys_platform == 'linux' and (platform_machine == 'x86_64' or platform_machine == 'aarch64')",
   "colored==2.2.3",
-  "ray[default]==2.49.2",
+  "ray[default]==2.53.0",
   "transformers==4.57.1",
   "wandb",
   "numpy",
@@ -76,18 +76,17 @@ vllm = [
   # sudo apt-get update
   # sudo apt-get install libibverbs-dev
   "deep_ep @ git+https://github.com/deepseek-ai/DeepEP.git@bfded34800dfec415b71503f8205181de90b2480",
-  "vllm==0.11.2",
+  "vllm==0.15.0",
   "num2words>=0.5.14",
 ]
 sglang = [
-  "sglang==0.5.7",
+  "sglang==0.5.8",
   "orjson",
   "uvloop",
   "requests",
   "openai",
   "partial-json-parser",
   "sentencepiece",
-  "sgl-kernel",
   "compressed-tensors",
   "msgspec",
   "python-multipart",
@@ -124,7 +123,7 @@ nemo_gym = ["nemo_gym"]
 # This is a default group so that we install these even with bare `uv sync`
 build = [
   # Build requirement for TE
-  "torch==2.9.0",
+  "torch==2.9.1",
   # Build requirement for TE
   "setuptools",
   "packaging",
@@ -186,7 +185,6 @@ triton = [
 causal-conv1d = { git = "https://github.com/Dao-AILab/causal-conv1d", rev = "67e0a9dfe1518fc0036444e9ab5fe06ab78299e0" }
 mamba-ssm = { git = "https://github.com/state-spaces/mamba.git", rev = "d68d16ed7d5d5164eb5a57c0285f3b7eb8394ec1" }
 nv-grouped-gemm = { git = "https://github.com/fanshiqing/grouped_gemm", tag = "v1.1.4.post7" }
-sgl-kernel = { git = "https://github.com/sgl-project/sglang", tag = "v0.5.7", subdirectory = "sgl-kernel" }
 
 [tool.uv.workspace]
 members = [
@@ -224,7 +222,6 @@ no-build-isolation-package = [
   "deep_gemm",
   "deep_ep",
   "nv-grouped-gemm",          # from mlm (added here to make sure it's built no isolation since mlm workspace uses setup.py)
-  "sgl-kernel",
 ]
 # Always apply the build group since dependencies like TE/mcore/nemo-run require build dependencies
 # and this lets us assume they are implicitly installed with a simply `uv sync`. Ideally, we'd
@@ -244,9 +241,8 @@ override-dependencies = [
   "opencv-python-headless>=4.11.0",
   "timm<=1.0.22",
   "nvidia-modelopt[torch]>=0.39.0",
-  # sglang requires torch 2.9.1, but we need 2.9.0
-  "torch==2.9.0",
-  "torchaudio==2.9.0",
+  "torch==2.9.1",
+  "torchaudio==2.9.1",
   # sglang has conflicting llguidance versions than vllm, so enforcing vllm's version since it's newer
   "llguidance>=1.3.0,<1.4.0",
   # Override setuptools range in other dependencies to address CVE GHSA-58pv-8j8x-9vj2
@@ -295,7 +291,7 @@ transformer-engine-torch = [{ requirement = "torch", match-runtime = true }]
 mamba-ssm = [{ requirement = "torch", match-runtime = true }]
 causal-conv1d = [{ requirement = "torch", match-runtime = true }]
 nv-grouped-gemm = [{ requirement = "torch", match-runtime = true }]
-sgl-kernel = [{ requirement = "torch", match-runtime = true }]
+#sgl-kernel = [{ requirement = "torch", match-runtime = true }]
 
 # Needed when building from source
 [[tool.uv.dependency-metadata]]
@@ -332,11 +328,11 @@ name = "nv-grouped-gemm"
 version = "v1.1.4.post7"
 requires-dist = ["setuptools", "wheel", "torch", "numpy"]
 
-[[tool.uv.dependency-metadata]]
-name = "sgl-kernel"
-# This version has to match the version in the commit/rev/tag used
-version = "0.3.20"
-requires-dist = ["torch", "scikit-build-core", "wheel"]
+#[[tool.uv.dependency-metadata]]
+#name = "sgl-kernel"
+## This version has to match the version in the commit/rev/tag used
+#version = "0.3.20"
+#requires-dist = ["torch", "scikit-build-core", "wheel"]
 
 [tool.black]
 line-length = 120

@@ -25,7 +25,7 @@ GIT_REF=${2:-cc99baf14dacc2497d0c5ed84e076ef2c37f6a4d}
 # NOTE: VLLM_USE_PRECOMPILED=1 didn't always seem to work since the wheels were sometimes built against an incompatible torch/cuda combo.
 # This commit was chosen as one close to the v0.10 release: git merge-base --fork-point origin/main tags/v0.10.0
 VLLM_WHEEL_COMMIT=${3:-862f2ef893d9751db0a92bd2d4ae0e3d9677872f}  # use full commit hash from the main branch
-export VLLM_PRECOMPILED_WHEEL_LOCATION="https://wheels.vllm.ai/${VLLM_WHEEL_COMMIT}/vllm-1.0.0.dev-cp38-abi3-manylinux1_x86_64.whl"
+export VLLM_PRECOMPILED_WHEEL_LOCATION="https://wheels.vllm.ai/${VLLM_WHEEL_COMMIT}/vllm-1.0.0.dev-cp38-abi3-manylinux1_$(uname -m).whl"
 
 BUILD_DIR=$(realpath "$SCRIPT_DIR/../3rdparty/vllm")
 if [[ -e "$BUILD_DIR" ]]; then
@@ -60,15 +60,15 @@ find requirements/ -name "*.txt" -type f -exec sed -i 's/#.*$//' {} \; 2>/dev/nu
 find requirements/ -name "*.txt" -type f -exec sed -i '/^[[:space:]]*$/d' {} \; 2>/dev/null || true
 # Replace xformers==.* (but preserve any platform markers at the end)
 # NOTE: that xformers is bumped from 0.0.30 to 0.0.31 to work with torch==2.7.1. This version may need to change to change when we upgrade torch.
-find requirements/ -name "*.txt" -type f -exec sed -i -E 's/^(xformers)==[^;[:space:]]*/\1==0.0.32.post1/' {} \; 2>/dev/null || true
+#find requirements/ -name "*.txt" -type f -exec sed -i -E 's/^(xformers)==[^;[:space:]]*/\1==0.0.32.post1/' {} \; 2>/dev/null || true
 
 uv run --no-project use_existing_torch.py
 
 # Install dependencies
 echo "Installing dependencies..."
 uv pip install --upgrade pip
 uv pip install numpy setuptools setuptools_scm
-uv pip install torch==2.9.0 --torch-backend=cu129
+uv pip install torch==2.9.1 --torch-backend=cu129
 
 # Install vLLM using precompiled wheel
 echo "Installing vLLM with precompiled wheel..."