diff --git a/vllm/model_executor/layers/fused_moe/fused_moe.py b/vllm/model_executor/layers/fused_moe/fused_moe.py index a3f887b6d2001..3ea6217d7c0ef 100644 --- a/vllm/model_executor/layers/fused_moe/fused_moe.py +++ b/vllm/model_executor/layers/fused_moe/fused_moe.py @@ -708,7 +708,7 @@ def fused_experts_impl(hidden_states: torch.Tensor, elif hidden_states.dtype == torch.float32: compute_type = tl.float32 else: - logger.error(f"Unsupported compute_type for fused_experts_impl: {hidden_states.dtype} !") + raise ValueError(f"Unsupported compute_type: {hidden_states.dtype}") if inplace: out_hidden_states = hidden_states