vllm_omni.attention.fish_kvcache_attn
can_use_fish_kvcache_attn
can_use_fish_kvcache_attn(
    *,
    query: Tensor,
    key_cache: Tensor,
    value_cache: Tensor,
    block_table: Tensor | None,
    seq_lens: Tensor,
    max_query_len: int,
    max_seq_len: int,
    dcp_world_size: int,
    use_cascade: bool,
    alibi_slopes: Any,
    sliding_window: Any,
    output_scale: Tensor | None = None,
    output_block_scale: Tensor | None = None,
) -> bool