[misc] refactor speculative config (vllm-project#25657)

yyzxw · web-flow · commit 19f76ee68e60 · 2025-09-26T01:22:06.000-07:00
Signed-off-by: zxw &lt;1020938856@qq.com&gt;
diff --git a/vllm/config/speculative.py b/vllm/config/speculative.py
@@ -209,12 +209,9 @@ def __post_init__(self):
 
         if self.model is None and self.num_speculative_tokens is not None:
             # TODO(Shangming): Refactor mtp configuration logic when supporting
-            # mtp acceleration for more models besides deepseek_v3
-            if self.target_model_config and \
-                (self.target_model_config.hf_text_config.model_type \
-                        == "deepseek_v3" or
-                    self.target_model_config.hf_text_config.model_type in
-                        ("mimo","ernie4_5_moe", "qwen3_next")):
+            if (self.target_model_config
+                    and self.target_model_config.hf_text_config.model_type
+                    in ("deepseek_v3", "mimo", "ernie4_5_moe", "qwen3_next")):
                 # use the draft model from the same model:
                 self.model = self.target_model_config.model
                 # Align the quantization of draft model for cases such as
@@ -224,8 +221,9 @@ def __post_init__(self):
             elif self.method in ("ngram", "[ngram]"):
                 self.model = "ngram"
             else:
-                raise ValueError("num_speculative_tokens was provided without "
-                                 "speculative model.")
+                raise ValueError(
+                    "num_speculative_tokens was provided but without "
+                    "speculative model.")
 
         # Automatically configure the method for ngram when "model" is used
         # instead of "method"