requests
tqdm
numpy
IPython
setproctitle

[all]
sglang[srt]
sglang[openai]
sglang[anthropic]
sglang[litellm]

[all_cpu]
sglang[srt_cpu]
sglang[openai]
sglang[anthropic]
sglang[litellm]

[all_hip]
sglang[srt_hip]
sglang[openai]
sglang[anthropic]
sglang[litellm]

[all_hpu]
sglang[srt_hpu]
sglang[openai]
sglang[anthropic]
sglang[litellm]

[all_xpu]
sglang[srt_xpu]
sglang[openai]
sglang[anthropic]
sglang[litellm]

[anthropic]
anthropic>=0.20.0

[dev]
sglang[all]
sglang[test]

[dev_cpu]
sglang[all_cpu]
sglang[test]

[dev_hip]
sglang[all_hip]
sglang[test]

[dev_hpu]
sglang[all_hpu]
sglang[test]

[dev_xpu]
sglang[all_xpu]
sglang[test]

[litellm]
litellm>=1.0.0

[openai]
openai>=1.0
tiktoken

[runtime_common]
aiohttp
decord
fastapi
hf_transfer
huggingface_hub
interegular
modelscope
orjson
outlines<0.1.0,>=0.0.44
packaging
pillow
prometheus-client>=0.20.0
psutil
pydantic
python-multipart
pyzmq>=25.1.2
torchao>=0.7.0
uvicorn
uvloop
xgrammar>=0.1.10

[srt]
sglang[runtime_common]
cuda-python
sgl-kernel>=0.0.3
torch
vllm==0.6.4.post1
flashinfer==0.1.6

[srt_cpu]
sglang[runtime_common]
torch

[srt_hip]
sglang[runtime_common]
torch
vllm==0.6.3.post2.dev1

[srt_hpu]
sglang[runtime_common]

[srt_xpu]
sglang[runtime_common]

[test]
jsonlines
matplotlib
pandas
sentence_transformers
accelerate
peft

[torch_memory_saver]
torch_memory_saver
