.gitignore
.readthedocs.yaml
CMakeLists.txt
CODE_OF_CONDUCT.md
DCO
Dockerfile
LICENSE
README.md
README.zh.md
format.sh
mypy.ini
packages.txt
pta_install.sh
pyproject.toml
pytest.ini
requirements-dev.txt
requirements-lint.txt
requirements.txt
setup.py
.github/PULL_REQUEST_TEMPLATE.md
.github/dependabot.yml
.github/labeler.yml
.github/ISSUE_TEMPLATE/100-documentation.yml
.github/ISSUE_TEMPLATE/200-installation.yml
.github/ISSUE_TEMPLATE/300-usage.yml
.github/ISSUE_TEMPLATE/400-bug-report.yml
.github/ISSUE_TEMPLATE/500-feature-request.yml
.github/ISSUE_TEMPLATE/600-new-model.yml
.github/ISSUE_TEMPLATE/700-performance-discussion.yml
.github/ISSUE_TEMPLATE/750-RFC.yml
.github/ISSUE_TEMPLATE/800-others.yml
.github/ISSUE_TEMPLATE/config.yml
.github/workflows/actionlint.yml
.github/workflows/image.yml
.github/workflows/labeler.yml
.github/workflows/mypy.yaml
.github/workflows/ruff.yml
.github/workflows/shellcheck.yml
.github/workflows/vllm_ascend_test.yaml
.github/workflows/yapf.yml
.github/workflows/matchers/actionlint.json
.github/workflows/matchers/mypy.json
.github/workflows/matchers/ruff.json
cmake/utils.cmake
csrc/ops.h
csrc/torch_binding.cpp
csrc/utils.h
csrc/kernels/pos_encoding_kernels.cpp
csrc/kernels/types.h
csrc/kernels/utils.h
docs/Makefile
docs/README.md
docs/requirements-docs.txt
docs/requirements-test.txt
docs/source/conf.py
docs/source/faqs.md
docs/source/index.md
docs/source/installation.md
docs/source/quick_start.md
docs/source/developer_guide/contributing.md
docs/source/developer_guide/contributing.zh.md
docs/source/developer_guide/versioning_policy.md
docs/source/developer_guide/versioning_policy.zh.md
docs/source/logos/vllm-ascend-logo-text-dark.png
docs/source/logos/vllm-ascend-logo-text-light.png
docs/source/tutorials/index.md
docs/source/tutorials/multi_node.md
docs/source/tutorials/multi_npu.md
docs/source/tutorials/single_npu.md
docs/source/tutorials/single_npu_multimodal.md
docs/source/user_guide/release.template.md
docs/source/user_guide/release_notes.md
docs/source/user_guide/supported_models.md
docs/source/user_guide/suppoted_features.md
examples/offline_distributed_inference_npu.py
examples/offline_inference_audio_language.py
examples/offline_inference_npu.py
tests/conftest.py
tests/model_utils.py
tests/test_offline_inference.py
tests/ops/test_rotary_embedding.py
tools/actionlint.sh
tools/check_repo.sh
tools/mypy.sh
tools/png-lint.sh
tools/shellcheck.sh
tools/sphinx-lint.sh
vllm_ascend/__init__.py
vllm_ascend/_version.py
vllm_ascend/communicator.py
vllm_ascend/envs.py
vllm_ascend/patch_module.py
vllm_ascend/platform.py
vllm_ascend/utils.py
vllm_ascend.egg-info/PKG-INFO
vllm_ascend.egg-info/SOURCES.txt
vllm_ascend.egg-info/dependency_links.txt
vllm_ascend.egg-info/entry_points.txt
vllm_ascend.egg-info/requires.txt
vllm_ascend.egg-info/top_level.txt
vllm_ascend/attention/__init__.py
vllm_ascend/attention/attention.py
vllm_ascend/attention/attention_v1.py
vllm_ascend/models/__init__.py
vllm_ascend/models/deepseek_v2.py
vllm_ascend/models/qwen2_vl.py
vllm_ascend/ops/__init__.py
vllm_ascend/ops/activation.py
vllm_ascend/ops/fused_moe.py
vllm_ascend/ops/layernorm.py
vllm_ascend/ops/rotary_embedding.py
vllm_ascend/patch/__init__.py
vllm_ascend/patch/patch_cache_dtype.py
vllm_ascend/patch/patch_metrics.py
vllm_ascend/patch/patch_minicpm.py
vllm_ascend/patch/patch_rejection_sampler.py
vllm_ascend/patch/patch_spec_decode_worker.py
vllm_ascend/patch/ray_patch.py
vllm_ascend/quantization/__init__.py
vllm_ascend/quantization/quant_config.py
vllm_ascend/quantization/quantizer.py
vllm_ascend/worker/__init__.py
vllm_ascend/worker/draft_model_runner.py
vllm_ascend/worker/model_runner.py
vllm_ascend/worker/model_runner_v1.py
vllm_ascend/worker/multi_step_runner.py
vllm_ascend/worker/multi_step_worker.py
vllm_ascend/worker/pooling_model_runner.py
vllm_ascend/worker/worker.py
vllm_ascend/worker/worker_v1.py