tangled
alpha
login
or
join now
tjh.dev
/
nixpkgs
0
fork
atom
nixpkgs mirror (for testing)
github.com/NixOS/nixpkgs
nix
0
fork
atom
overview
issues
pulls
pipelines
python312Packages.vllm: 0.9.0.1 -> 0.9.1
Conroy Cheers
10 months ago
e58aa1c6
5b0471b7
+51
-29
2 changed files
expand all
collapse all
unified
split
pkgs
development
python-modules
vllm
0005-drop-intel-reqs.patch
default.nix
+17
-4
pkgs/development/python-modules/vllm/0005-drop-intel-reqs.patch
reviewed
···
1
1
+
From 7511784ceb9252091a9d63ac6b54dcc67dd2b262 Mon Sep 17 00:00:00 2001
2
2
+
From: Conroy Cheers <conroy@corncheese.org>
3
3
+
Date: Fri, 13 Jun 2025 17:42:10 +1000
4
4
+
Subject: [PATCH] drop intel reqs
5
5
+
6
6
+
---
7
7
+
requirements/cpu.txt | 3 ---
8
8
+
1 file changed, 3 deletions(-)
9
9
+
1
10
diff --git a/requirements/cpu.txt b/requirements/cpu.txt
2
2
-
index 121330158..d41918883 100644
11
11
+
index d7b0fc6d8..be2df751b 100644
3
12
--- a/requirements/cpu.txt
4
13
+++ b/requirements/cpu.txt
5
5
-
@@ -20,7 +20,3 @@ datasets # for benchmark scripts
6
6
-
14
14
+
@@ -24,8 +24,5 @@ datasets # for benchmark scripts
7
15
# cpu cannot use triton 3.3.0
8
16
triton==3.2.0; platform_machine == "x86_64"
9
9
-
-
17
17
+
10
18
-# Intel Extension for PyTorch, only for x86_64 CPUs
11
19
-intel-openmp==2024.2.1; platform_machine == "x86_64"
12
20
-intel_extension_for_pytorch==2.7.0; platform_machine == "x86_64"
21
21
+
py-libnuma; platform_system != "Darwin"
22
22
+
psutil; platform_system != "Darwin"
23
23
+
--
24
24
+
2.49.0
25
25
+
+34
-25
pkgs/development/python-modules/vllm/default.nix
reviewed
···
3
3
stdenv,
4
4
python,
5
5
buildPythonPackage,
6
6
+
pythonAtLeast,
6
7
fetchFromGitHub,
7
8
fetchpatch,
8
9
symlinkJoin,
···
68
67
opentelemetry-exporter-otlp,
69
68
bitsandbytes,
70
69
flashinfer,
70
70
+
py-libnuma,
71
71
72
72
# internal dependency - for overriding in overlays
73
73
vllm-flash-attn ? null,
···
248
246
249
247
buildPythonPackage rec {
250
248
pname = "vllm";
251
251
-
version = "0.9.0.1";
249
249
+
version = "0.9.1";
252
250
pyproject = true;
251
251
+
252
252
+
# https://github.com/vllm-project/vllm/issues/12083
253
253
+
disabled = pythonAtLeast "3.13";
253
254
254
255
stdenv = torch.stdenv;
255
256
···
260
255
owner = "vllm-project";
261
256
repo = "vllm";
262
257
tag = "v${version}";
263
263
-
hash = "sha256-gNe/kdsDQno8Fd6mo29feWmbyC0c2+kljlVxY4v7R9U=";
258
258
+
hash = "sha256-sp7rDpewTPXTVRBJHJMj+8pJDS6wAu0/OTJZwbPPqKc=";
264
259
};
265
260
266
261
patches = [
···
269
264
url = "https://github.com/vllm-project/vllm/commit/6a5d7e45f52c3a13de43b8b4fa9033e3b342ebd2.patch";
270
265
hash = "sha256-KYthqu+6XwsYYd80PtfrMMjuRV9+ionccr7EbjE4jJE=";
271
266
})
267
267
+
(fetchpatch {
268
268
+
name = "fall-back-to-gloo-when-nccl-unavailable.patch";
269
269
+
url = "https://github.com/vllm-project/vllm/commit/aa131a94410683b0a02e74fed2ce95e6c2b6b030.patch";
270
270
+
hash = "sha256-jNlQZQ8xiW85JWyBjsPZ6FoRQsiG1J8bwzmQjnaWFBg=";
271
271
+
})
272
272
./0002-setup.py-nix-support-respect-cmakeFlags.patch
273
273
./0003-propagate-pythonpath.patch
274
274
./0004-drop-lsmod.patch
275
275
./0005-drop-intel-reqs.patch
276
276
];
277
277
278
278
-
postPatch =
279
279
-
''
280
280
-
# pythonRelaxDeps does not cover build-system
281
281
-
substituteInPlace pyproject.toml \
282
282
-
--replace-fail "torch ==" "torch >="
278
278
+
postPatch = ''
279
279
+
# pythonRelaxDeps does not cover build-system
280
280
+
substituteInPlace pyproject.toml \
281
281
+
--replace-fail "torch ==" "torch >="
283
282
284
284
-
# Ignore the python version check because it hard-codes minor versions and
285
285
-
# lags behind `ray`'s python interpreter support
286
286
-
substituteInPlace CMakeLists.txt \
287
287
-
--replace-fail \
288
288
-
'set(PYTHON_SUPPORTED_VERSIONS' \
289
289
-
'set(PYTHON_SUPPORTED_VERSIONS "${lib.versions.majorMinor python.version}"'
283
283
+
# Ignore the python version check because it hard-codes minor versions and
284
284
+
# lags behind `ray`'s python interpreter support
285
285
+
substituteInPlace CMakeLists.txt \
286
286
+
--replace-fail \
287
287
+
'set(PYTHON_SUPPORTED_VERSIONS' \
288
288
+
'set(PYTHON_SUPPORTED_VERSIONS "${lib.versions.majorMinor python.version}"'
290
289
291
291
-
# Pass build environment PYTHONPATH to vLLM's Python configuration scripts
292
292
-
substituteInPlace CMakeLists.txt \
293
293
-
--replace-fail '$PYTHONPATH' '$ENV{PYTHONPATH}'
294
294
-
''
295
295
-
+ lib.optionalString (nccl == null) ''
296
296
-
# On platforms where NCCL is not supported (e.g. Jetson), substitute Gloo (provided by Torch)
297
297
-
substituteInPlace vllm/distributed/parallel_state.py \
298
298
-
--replace-fail '"nccl"' '"gloo"'
299
299
-
'';
290
290
+
# Pass build environment PYTHONPATH to vLLM's Python configuration scripts
291
291
+
substituteInPlace CMakeLists.txt \
292
292
+
--replace-fail '$PYTHONPATH' '$ENV{PYTHONPATH}'
293
293
+
'';
300
294
301
295
nativeBuildInputs =
302
296
[
···
366
362
outlines
367
363
pandas
368
364
prometheus-fastapi-instrumentator
369
369
-
psutil
370
365
py-cpuinfo
371
366
pyarrow
372
367
pydantic
···
395
392
opentelemetry-api
396
393
opentelemetry-exporter-otlp
397
394
bitsandbytes
395
395
+
# vLLM needs Torch's compiler to be present in order to use torch.compile
396
396
+
torch.stdenv.cc
398
397
]
399
398
++ uvicorn.optional-dependencies.standard
400
399
++ aioprometheus.optional-dependencies.starlette
400
400
+
++ lib.optionals stdenv.targetPlatform.isLinux [
401
401
+
py-libnuma
402
402
+
psutil
403
403
+
]
401
404
++ lib.optionals cudaSupport [
402
405
cupy
403
406
pynvml
···
413
404
dontUseCmakeConfigure = true;
414
405
cmakeFlags =
415
406
[
407
407
+
]
408
408
+
++ lib.optionals cudaSupport [
416
409
(lib.cmakeFeature "FETCHCONTENT_SOURCE_DIR_CUTLASS" "${lib.getDev cutlass}")
417
410
(lib.cmakeFeature "FLASH_MLA_SRC_DIR" "${lib.getDev flashmla}")
418
411
(lib.cmakeFeature "VLLM_FLASH_ATTN_SRC_DIR" "${lib.getDev vllm-flash-attn'}")
419
419
-
]
420
420
-
++ lib.optionals cudaSupport [
421
412
(lib.cmakeFeature "TORCH_CUDA_ARCH_LIST" "${gpuTargetString}")
422
413
(lib.cmakeFeature "CUTLASS_NVCC_ARCHS_ENABLED" "${cudaPackages.flags.cmakeCudaArchitecturesString}")
423
414
(lib.cmakeFeature "CUDA_TOOLKIT_ROOT_DIR" "${symlinkJoin {