diff --git a/vllm/_custom_ops.py b/vllm/_custom_ops.py index e60158898685..28758acf46ff 100644 --- a/vllm/_custom_ops.py +++ b/vllm/_custom_ops.py @@ -1180,7 +1180,6 @@ def gptq_marlin_repack( if hasattr(torch.ops._C, "gptq_marlin_repack"): - @register_fake("_C::gptq_marlin_repack") def _gptq_marlin_repack_fake( b_q_weight: torch.Tensor, perm: torch.Tensor, @@ -1213,7 +1212,6 @@ def awq_marlin_repack( if hasattr(torch.ops._C, "awq_marlin_repack"): - @register_fake("_C::awq_marlin_repack") def _awq_marlin_repack_fake( b_q_weight: torch.Tensor, size_k: torch.SymInt,