File tree Expand file tree Collapse file tree 3 files changed +3
-3
lines changed Expand file tree Collapse file tree 3 files changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -331,7 +331,6 @@ def compile_or_call(*args):
331331
332332 self .compiled = True
333333
334- logger .info (f"[Mirage] Calling the compiled result..." )
335334 result_hidden_states = self .mpk ()
336335
337336 return (result_hidden_states ,)
Original file line number Diff line number Diff line change @@ -346,7 +346,7 @@ def get_attn_backend_cls(
346346 FLASH_ATTN_V1 = "vllm.v1.attention.backends.flash_attn.FlashAttentionBackend" # noqa: E501
347347 TREE_ATTN_V1 = "vllm.v1.attention.backends.tree_attn.TreeAttentionBackend" # noqa: E501
348348 XFORMERS_V1 = "vllm.v1.attention.backends.xformers.XFormersAttentionBackend" # noqa: E501
349- MIRAGE_V1 = "vllm.v1.attention.backends.mirage.MirageBackend " # noqa: E501
349+ MIRAGE_V1 = "vllm.v1.attention.backends.mirage.MirageAttentionBackend " # noqa: E501
350350
351351 use_fp8_kv_cache = kv_cache_dtype is not None and kv_cache_dtype .startswith (
352352 "fp8"
Original file line number Diff line number Diff line change 2222
2323from vllm .platforms import current_platform
2424from vllm .triton_utils import tl , triton
25- from vllm .utils import cdiv , is_pin_memory_available
25+ from vllm .utils .math_utils import cdiv
26+ from vllm .utils .platform_utils import is_pin_memory_available
2627from vllm .v1 .attention .backends .utils import (
2728 AttentionCGSupport ,
2829 AttentionMetadataBuilder ,
You can’t perform that action at this time.
0 commit comments