vllm@0.20.0

A high-throughput and memory-efficient inference and serving engine for LLMs

2026-04-27 Python <3.15,>=3.10 wheel sdist
安装 (0.20.0)
pip install vllm==0.20.0
poetry add vllm==0.20.0
pipenv install vllm==0.20.0
conda install vllm=0.20.0
依赖 (92)
依赖
regex
cachetools
psutil
sentencepiece
numpy
requests>=2.26.0
tqdm
blake3
py-cpuinfo
transformers!=5.0.*,!=5.1.*,!=5.2.*,!=5.3.*,!=5.4.*,!=5.5.0,>=4.56.0
tokenizers>=0.21.1
safetensors>=0.6.2
protobuf!=6.30.*,!=6.31.*,!=6.32.*,!=6.33.0.*,!=6.33.1.*,!=6.33.2.*,!=6.33.3.*,!=6.33.4.*,>=5.29.6
fastapi[standard]>=0.115.0
aiohttp>=3.13.3
openai>=2.0.0
pydantic>=2.12.0
prometheus_client>=0.18.0
pillow
prometheus-fastapi-instrumentator>=7.0.0
tiktoken>=0.6.0
lm-format-enforcer==0.11.3
llguidance<1.8.0,>=1.7.0; platform_machine == "x86_64" or platform_machine == "arm64" or platform_machine == "aarch64" or platform_machine == "ppc64le"
outlines_core==0.2.14
diskcache==5.6.3
lark==1.2.2
xgrammar<1.0.0,>=0.2.0; platform_machine == "x86_64" or platform_machine == "aarch64" or platform_machine == "arm64" or platform_machine == "s390x" or platform_machine == "ppc64le"
typing_extensions>=4.10
filelock>=3.16.1
partial-json-parser
pyzmq>=25.0.0
msgspec
gguf>=0.17.0
mistral_common[image]>=1.11.3
opencv-python-headless>=4.13.0
pyyaml
six>=1.16.0; python_version > "3.11"
setuptools<81.0.0,>=77.0.3; python_version > "3.11"
einops
compressed-tensors==0.17.0
depyf==0.20.0
cloudpickle
watchfiles
python-json-logger
ninja
pybase64
cbor2
ijson
setproctitle
openai-harmony>=0.0.3
anthropic>=0.71.0
model-hosting-container-standards<1.0.0,>=0.1.14
mcp
opentelemetry-sdk>=1.27.0
opentelemetry-api>=1.27.0
opentelemetry-exporter-otlp>=1.27.0
opentelemetry-semantic-conventions-ai>=0.4.1
numba==0.65.0
torch==2.11.0
torchaudio==2.11.0
torchvision==0.26.0
flashinfer-python==0.6.12
flashinfer-cubin==0.6.12
apache-tvm-ffi==0.1.9
tilelang==0.1.9
nvidia-cudnn-frontend>=1.19.1
fastsafetensors>=0.3.2
nvidia-cutlass-dsl[cu13]==4.5.2
quack-kernels>=0.3.3
tokenspeed-mla==0.1.2
humming-kernels[cu13]==0.1.4
zentorch==2.11.0.0; extra == "zen"
pandas; extra == "bench"
matplotlib; extra == "bench"
seaborn; extra == "bench"
datasets; extra == "bench"
scipy; extra == "bench"
plotly; extra == "bench"
tensorizer==2.10.1; extra == "tensorizer"
fastsafetensors>=0.3.2; extra == "fastsafetensors"
instanttensor>=0.1.5; extra == "instanttensor"
runai-model-streamer[azure,gcs,s3]>=0.15.7; extra == "runai"
av; extra == "audio"
scipy; extra == "audio"
soundfile; extra == "audio"
mistral_common[audio]; extra == "audio"
helion==1.0.0; extra == "helion"
smg-grpc-servicer[vllm]>=0.5.2; extra == "grpc"
opentelemetry-sdk>=1.26.0; extra == "otel"
opentelemetry-api>=1.26.0; extra == "otel"
opentelemetry-exporter-otlp>=1.26.0; extra == "otel"
opentelemetry-semantic-conventions-ai>=0.4.1; extra == "otel"
下载文件
文件名 类型 Python 版本 大小
vllm-0.20.0-cp38-abi3-manylinux_2_35_aarch64.whl bdist_wheel cp38 235776358 bytes
vllm-0.20.0-cp38-abi3-manylinux_2_35_x86_64.whl bdist_wheel cp38 244415937 bytes
vllm-0.20.0.tar.gz sdist source 33508260 bytes
版本列表
0.23.0 2026-06-15
0.22.1 2026-06-05
0.22.0 2026-05-29
0.21.0 2026-05-15
0.20.2 2026-05-10
0.20.1 2026-05-04
0.20.0 2026-04-27
0.19.1 2026-04-18
0.19.0 2026-04-03
0.18.1 2026-03-31
0.18.0 2026-03-20
0.17.1 2026-03-11
0.17.0 2026-03-07
0.16.0 2026-02-26
0.15.1 2026-02-05
0.15.0 2026-01-29
0.14.1 2026-01-24
0.14.0 2026-01-20
0.13.0 2025-12-19
0.12.0 2025-12-03
0.11.2 2025-11-20
0.11.1 2025-11-19
0.11.0 2025-10-04
0.10.2 2025-09-13
0.10.1.1 2025-08-20
0.10.1 2025-08-19
0.10.0 2025-07-25
0.9.2 2025-07-08
0.9.1 2025-06-10
0.9.0.1 2025-05-30
0.9.0 2025-05-28
0.8.5 2025-04-28
0.8.5.post1 2025-05-02
0.8.4 2025-04-15
0.8.3 2025-04-06
0.8.2 2025-03-25
0.8.1 2025-03-19
0.8.0 2025-03-18
0.7.3 2025-02-20
0.7.2 2025-02-06
0.7.1 2025-02-01
0.7.0 2025-01-27
0.6.6 2024-12-27
0.6.6.post1 2024-12-27
0.6.5 2024-12-18
0.6.4 2024-11-15
0.6.4.post1 2024-11-15
0.6.3 2024-10-14
0.6.3.post1 2024-10-17
0.6.2 2024-09-25
0.6.1 2024-09-11
0.6.1.post2 2024-09-13
0.6.1.post1 2024-09-13
0.6.0 2024-09-05
0.5.5 2024-08-23
0.5.4 2024-08-05
0.5.3 2024-07-23
0.5.3.post1 2024-07-23
0.5.2 2024-07-15
0.5.1 2024-07-06
0.5.0 2024-06-11
0.5.0.post1 2024-06-14
0.4.3 2024-06-01
0.4.2 2024-05-05
0.4.1 2024-04-24
0.4.0 2024-03-31
0.4.0.post1 2024-04-03
0.3.3 2024-03-01
0.3.2 2024-02-21
0.3.1 2024-02-17
0.3.0 2024-01-31
0.2.7 2024-01-04
0.2.6 2023-12-17
0.2.5 2023-12-14
0.2.4 2023-12-11
0.2.3 2023-12-03
0.2.2 2023-11-19
0.2.1 2023-10-16
0.2.1.post1 2023-10-17
0.2.0 2023-09-28
0.1.7 2023-09-11
0.1.6 2023-09-08
0.1.5 2023-09-08
0.1.4 2023-08-25
0.1.3 2023-08-02
0.1.2 2023-07-05
0.1.1 2023-06-22
0.1.0 2023-06-20
0.0.1 2023-06-19