Skip to content

Commit b0d6393

Browse files
committed
fix: added stubs to address vllm-project#17159
Signed-off-by: Aaron Pham <[email protected]>
1 parent 909fdaf commit b0d6393

File tree

4 files changed

+475
-2
lines changed

4 files changed

+475
-2
lines changed

pyproject.toml

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -58,7 +58,8 @@ ignore_patterns = [
5858
line-length = 80
5959
exclude = [
6060
# External file, leaving license intact
61-
"examples/other/fp8/quantizer/quantize.py"
61+
"examples/other/fp8/quantizer/quantize.py",
62+
"vllm/vllm_flash_attn/flash_attn_interface.pyi"
6263
]
6364

6465
[tool.ruff.lint.per-file-ignores]

setup.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -378,7 +378,6 @@ def run(self) -> None:
378378
"vllm/vllm_flash_attn/_vllm_fa2_C.abi3.so",
379379
"vllm/vllm_flash_attn/_vllm_fa3_C.abi3.so",
380380
"vllm/vllm_flash_attn/flash_attn_interface.py",
381-
"vllm/vllm_flash_attn/__init__.py",
382381
"vllm/cumem_allocator.abi3.so",
383382
# "vllm/_version.py", # not available in nightly wheels yet
384383
]

vllm/vllm_flash_attn/__init__.py

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,14 @@
1+
# SPDX-License-Identifier: Apache-2.0
2+
3+
from .flash_attn_interface import (fa_version_unsupported_reason,
4+
flash_attn_varlen_func,
5+
flash_attn_with_kvcache,
6+
get_scheduler_metadata,
7+
is_fa_version_supported, sparse_attn_func,
8+
sparse_attn_varlen_func)
9+
10+
__all__ = [
11+
'flash_attn_varlen_func', 'flash_attn_with_kvcache',
12+
'get_scheduler_metadata', 'sparse_attn_func', 'sparse_attn_varlen_func',
13+
'is_fa_version_supported', 'fa_version_unsupported_reason'
14+
]

0 commit comments

Comments
 (0)