diff --git a/CMakeLists.txt b/CMakeLists.txt index e09972fe7199..a9fa9b293b48 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -56,8 +56,8 @@ endif() # requirements.txt files and should be kept consistent. The ROCm torch # versions are derived from docker/Dockerfile.rocm # -set(TORCH_SUPPORTED_VERSION_CUDA "2.9.0") -set(TORCH_SUPPORTED_VERSION_ROCM "2.9.0") +set(TORCH_SUPPORTED_VERSION_CUDA "2.10.0") +set(TORCH_SUPPORTED_VERSION_ROCM "2.10.0") # # Try to find python package with an executable that exactly matches @@ -426,7 +426,7 @@ if(VLLM_GPU_LANG STREQUAL "CUDA") endif() list(APPEND VLLM_EXT_SRC ${MARLIN_TEMPLATE_BF16_KERNEL_SRC}) - if (MARLIN_FP8_ARCHS) + if (MARLIN_FP8_ARCHS) file(GLOB MARLIN_TEMPLATE_FP8_KERNEL_SRC "csrc/quantization/gptq_marlin/sm89_kernel_*.cu") set_gencode_flags_for_srcs( SRCS "${MARLIN_TEMPLATE_FP8_KERNEL_SRC}" diff --git a/docker/Dockerfile b/docker/Dockerfile index 0d50d97e54c6..60a1a9bb9d86 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -55,7 +55,7 @@ ARG UV_INDEX_URL=${PIP_INDEX_URL} ARG UV_EXTRA_INDEX_URL=${PIP_EXTRA_INDEX_URL} # PyTorch provides its own indexes for standard and nightly builds -ARG PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl +ARG PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly # PIP supports multiple authentication schemes, including keyring # By parameterizing the PIP_KEYRING_PROVIDER variable and setting it to diff --git a/docker/Dockerfile.cpu b/docker/Dockerfile.cpu index 8d55ecfba3e5..a806e989f6ff 100644 --- a/docker/Dockerfile.cpu +++ b/docker/Dockerfile.cpu @@ -26,7 +26,7 @@ FROM ubuntu:22.04 AS base-common WORKDIR /workspace/ ARG PYTHON_VERSION=3.12 -ARG PIP_EXTRA_INDEX_URL="https://download.pytorch.org/whl/cpu" +ARG PIP_EXTRA_INDEX_URL="https://download.pytorch.org/whl/nightly/cpu" # Install minimal dependencies and uv RUN --mount=type=cache,target=/var/cache/apt,sharing=locked \ diff --git a/pyproject.toml b/pyproject.toml index a250ab6567f1..79b9ddc94bc5 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -6,7 +6,7 @@ requires = [ "packaging>=24.2", "setuptools>=77.0.3,<81.0.0", "setuptools-scm>=8.0", - "torch == 2.9.0", + "torch", "wheel", "jinja2", ] diff --git a/requirements/build.txt b/requirements/build.txt index 23ff8d4fdc1c..c8d09c965cd4 100644 --- a/requirements/build.txt +++ b/requirements/build.txt @@ -4,7 +4,7 @@ ninja packaging>=24.2 setuptools>=77.0.3,<81.0.0 setuptools-scm>=8 -torch==2.9.0 +torch wheel jinja2>=3.1.6 regex diff --git a/requirements/cuda.txt b/requirements/cuda.txt index 462f18ef7159..4823d44acc5a 100644 --- a/requirements/cuda.txt +++ b/requirements/cuda.txt @@ -5,9 +5,9 @@ numba == 0.61.2 # Required for N-gram speculative decoding # Dependencies for NVIDIA GPUs ray[cgraph]>=2.48.0 # Ray Compiled Graph, required for pipeline parallelism in V1. -torch==2.9.0 -torchaudio==2.9.0 +torch +torchaudio # These must be updated alongside torch -torchvision==0.24.0 # Required for phi3v processor. See https://github.com/pytorch/vision?tab=readme-ov-file#installation for corresponding version +torchvision # Required for phi3v processor. See https://github.com/pytorch/vision?tab=readme-ov-file#installation for corresponding version # FlashInfer should be updated together with the Dockerfile flashinfer-python==0.5.3 diff --git a/requirements/rocm-build.txt b/requirements/rocm-build.txt index b977e80be067..569461ef457b 100644 --- a/requirements/rocm-build.txt +++ b/requirements/rocm-build.txt @@ -1,12 +1,12 @@ # Common dependencies -r common.txt ---extra-index-url https://download.pytorch.org/whl/rocm6.4 -torch==2.9.0 -torchvision==0.24.0 -torchaudio==2.9.0 +--extra-index-url https://download.pytorch.org/whl/nightly/rocm6.4 +torch +torchvision +torchaudio -triton==3.5.0 +pytorch-triton-rocm cmake>=3.26.1,<4 packaging>=24.2 setuptools>=77.0.3,<80.0.0 diff --git a/requirements/test.in b/requirements/test.in index dfae5b75821f..e080e7d69425 100644 --- a/requirements/test.in +++ b/requirements/test.in @@ -24,9 +24,9 @@ soundfile # required for audio tests jiwer # required for audio tests tblib # for pickling test exceptions timm >=1.0.17 # required for internvl and gemma3n-mm test -torch==2.9.0 -torchaudio==2.9.0 -torchvision==0.24.0 +torch +torchaudio +torchvision transformers_stream_generator # required for qwen-vl test matplotlib # required for qwen-vl test mistral_common[image,audio] >= 1.8.5 # required for voxtral test diff --git a/requirements/test.txt b/requirements/test.txt index 571194e05c1b..aaebaaddc3cb 100644 --- a/requirements/test.txt +++ b/requirements/test.txt @@ -1123,7 +1123,7 @@ tomli==2.2.1 # via schemathesis tomli-w==1.2.0 # via schemathesis -torch==2.9.0+cu129 +torch # via # -r requirements/test.in # accelerate @@ -1152,7 +1152,7 @@ torch==2.9.0+cu129 # torchvision # vector-quantize-pytorch # vocos -torchaudio==2.9.0+cu129 +torchaudio # via # -r requirements/test.in # encodec @@ -1165,7 +1165,7 @@ torchmetrics==1.7.4 # pytorch-lightning # terratorch # torchgeo -torchvision==0.24.0+cu129 +torchvision # via # -r requirements/test.in # lightly @@ -1206,7 +1206,7 @@ transformers==4.57.3 # transformers-stream-generator transformers-stream-generator==0.0.5 # via -r requirements/test.in -triton==3.5.0 +pytorch-triton # via torch tritonclient==2.51.0 # via diff --git a/requirements/xpu.txt b/requirements/xpu.txt index c1dc4195b523..8d9d2b9a2d58 100644 --- a/requirements/xpu.txt +++ b/requirements/xpu.txt @@ -10,8 +10,8 @@ wheel jinja2>=3.1.6 datasets # for benchmark scripts numba == 0.61.2 # Required for N-gram speculative decoding ---extra-index-url=https://download.pytorch.org/whl/xpu -torch==2.9.0+xpu +--extra-index-url=https://download.pytorch.org/whl/nightly/xpu +torch torchaudio torchvision