We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent eb69778, commit 824ce40. Copy full SHA for 824ce40
flashinfer/prefill.py
@@ -1951,8 +1951,8 @@ def plan(
1951
sm_scale: Optional[float] = None,
1952
rope_scale: Optional[float] = None,
1953
rope_theta: Optional[float] = None,
1954
- q_data_type: str = "float16",
1955
- kv_data_type: Optional[str] = None,
+ q_data_type: Union[str, torch.dtype] = "float16",
+ kv_data_type: Optional[Union[str, torch.dtype]] = None,
1956
) -> None:
1957
r"""Plan batch prefill/append attention on Ragged KV-Cache for given problem specification.
1958
0 commit comments