Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
30 changes: 13 additions & 17 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -19,10 +19,10 @@ dependencies = [
"setuptools",
"pip", # Required for frozen environments; uv venv --seed may not reliably install pip
"ninja", # for flash-attn parallel build
"torch==2.9.0",
"torch==2.9.1",
"triton; sys_platform == 'linux' and (platform_machine == 'x86_64' or platform_machine == 'aarch64')",
"colored==2.2.3",
"ray[default]==2.49.2",
"ray[default]==2.53.0",
"transformers==4.57.1",
"wandb",
"numpy",
Expand Down Expand Up @@ -76,18 +76,17 @@ vllm = [
# sudo apt-get update
# sudo apt-get install libibverbs-dev
"deep_ep @ git+https://github.com/deepseek-ai/DeepEP.git@bfded34800dfec415b71503f8205181de90b2480",
"vllm==0.11.2",
"vllm==0.15.0",
"num2words>=0.5.14",
]
sglang = [
"sglang==0.5.7",
"sglang==0.5.8",
"orjson",
"uvloop",
"requests",
"openai",
"partial-json-parser",
"sentencepiece",
"sgl-kernel",
"compressed-tensors",
"msgspec",
"python-multipart",
Expand Down Expand Up @@ -124,7 +123,7 @@ nemo_gym = ["nemo_gym"]
# This is a default group so that we install these even with bare `uv sync`
build = [
# Build requirement for TE
"torch==2.9.0",
"torch==2.9.1",
# Build requirement for TE
"setuptools",
"packaging",
Expand Down Expand Up @@ -186,7 +185,6 @@ triton = [
causal-conv1d = { git = "https://github.com/Dao-AILab/causal-conv1d", rev = "67e0a9dfe1518fc0036444e9ab5fe06ab78299e0" }
mamba-ssm = { git = "https://github.com/state-spaces/mamba.git", rev = "d68d16ed7d5d5164eb5a57c0285f3b7eb8394ec1" }
nv-grouped-gemm = { git = "https://github.com/fanshiqing/grouped_gemm", tag = "v1.1.4.post7" }
sgl-kernel = { git = "https://github.com/sgl-project/sglang", tag = "v0.5.7", subdirectory = "sgl-kernel" }

[tool.uv.workspace]
members = [
Expand Down Expand Up @@ -224,7 +222,6 @@ no-build-isolation-package = [
"deep_gemm",
"deep_ep",
"nv-grouped-gemm", # from mlm (added here to make sure it's built no isolation since mlm workspace uses setup.py)
"sgl-kernel",
]
# Always apply the build group since dependencies like TE/mcore/nemo-run require build dependencies
# and this lets us assume they are implicitly installed with a simply `uv sync`. Ideally, we'd
Expand All @@ -244,9 +241,8 @@ override-dependencies = [
"opencv-python-headless>=4.11.0",
"timm<=1.0.22",
"nvidia-modelopt[torch]>=0.39.0",
# sglang requires torch 2.9.1, but we need 2.9.0
"torch==2.9.0",
"torchaudio==2.9.0",
"torch==2.9.1",
"torchaudio==2.9.1",
# sglang has conflicting llguidance versions than vllm, so enforcing vllm's version since it's newer
"llguidance>=1.3.0,<1.4.0",
# Override setuptools range in other dependencies to address CVE GHSA-58pv-8j8x-9vj2
Expand Down Expand Up @@ -295,7 +291,7 @@ transformer-engine-torch = [{ requirement = "torch", match-runtime = true }]
mamba-ssm = [{ requirement = "torch", match-runtime = true }]
causal-conv1d = [{ requirement = "torch", match-runtime = true }]
nv-grouped-gemm = [{ requirement = "torch", match-runtime = true }]
sgl-kernel = [{ requirement = "torch", match-runtime = true }]
#sgl-kernel = [{ requirement = "torch", match-runtime = true }]

# Needed when building from source
[[tool.uv.dependency-metadata]]
Expand Down Expand Up @@ -332,11 +328,11 @@ name = "nv-grouped-gemm"
version = "v1.1.4.post7"
requires-dist = ["setuptools", "wheel", "torch", "numpy"]

[[tool.uv.dependency-metadata]]
name = "sgl-kernel"
# This version has to match the version in the commit/rev/tag used
version = "0.3.20"
requires-dist = ["torch", "scikit-build-core", "wheel"]
#[[tool.uv.dependency-metadata]]
#name = "sgl-kernel"
## This version has to match the version in the commit/rev/tag used
#version = "0.3.20"
#requires-dist = ["torch", "scikit-build-core", "wheel"]

[tool.black]
line-length = 120
Expand Down
6 changes: 3 additions & 3 deletions tools/build-custom-vllm.sh
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@ GIT_REF=${2:-cc99baf14dacc2497d0c5ed84e076ef2c37f6a4d}
# NOTE: VLLM_USE_PRECOMPILED=1 didn't always seem to work since the wheels were sometimes built against an incompatible torch/cuda combo.
# This commit was chosen as one close to the v0.10 release: git merge-base --fork-point origin/main tags/v0.10.0
VLLM_WHEEL_COMMIT=${3:-862f2ef893d9751db0a92bd2d4ae0e3d9677872f} # use full commit hash from the main branch
export VLLM_PRECOMPILED_WHEEL_LOCATION="https://wheels.vllm.ai/${VLLM_WHEEL_COMMIT}/vllm-1.0.0.dev-cp38-abi3-manylinux1_x86_64.whl"
export VLLM_PRECOMPILED_WHEEL_LOCATION="https://wheels.vllm.ai/${VLLM_WHEEL_COMMIT}/vllm-1.0.0.dev-cp38-abi3-manylinux1_$(uname -m).whl"

BUILD_DIR=$(realpath "$SCRIPT_DIR/../3rdparty/vllm")
if [[ -e "$BUILD_DIR" ]]; then
Expand Down Expand Up @@ -60,15 +60,15 @@ find requirements/ -name "*.txt" -type f -exec sed -i 's/#.*$//' {} \; 2>/dev/nu
find requirements/ -name "*.txt" -type f -exec sed -i '/^[[:space:]]*$/d' {} \; 2>/dev/null || true
# Replace xformers==.* (but preserve any platform markers at the end)
# NOTE: that xformers is bumped from 0.0.30 to 0.0.31 to work with torch==2.7.1. This version may need to change to change when we upgrade torch.
find requirements/ -name "*.txt" -type f -exec sed -i -E 's/^(xformers)==[^;[:space:]]*/\1==0.0.32.post1/' {} \; 2>/dev/null || true
#find requirements/ -name "*.txt" -type f -exec sed -i -E 's/^(xformers)==[^;[:space:]]*/\1==0.0.32.post1/' {} \; 2>/dev/null || true

uv run --no-project use_existing_torch.py

# Install dependencies
echo "Installing dependencies..."
uv pip install --upgrade pip
uv pip install numpy setuptools setuptools_scm
uv pip install torch==2.9.0 --torch-backend=cu129
uv pip install torch==2.9.1 --torch-backend=cu129

# Install vLLM using precompiled wheel
echo "Installing vLLM with precompiled wheel..."
Expand Down
Loading
Loading