@@ -62,8 +62,8 @@ def apply(self, router_logits) -> (torch.Tensor, torch.Tensor):
62 62 raise NotImplementedError(f"Not support balance_method {self.balance_method}")
63 63 return token_selected_experts, token_final_scales
6464
65- @functools.cache
66 65 @staticmethod
66+ @functools.cache
67 67 def get_balanced_selection(num_tokens, top_k, num_experts, dtype, world_size, rank):
68 68 a = torch.arange(num_tokens * world_size * top_k, dtype=dtype, device="cuda").view(
69 69 num_tokens, world_size, top_k
@@ -90,8 +90,8 @@ def apply_balance_ratio(imbalanced_experts, num_experts, balance_ratio, world_si
90 90 mixed_experts[num_balanced_tokens:] = imbalanced_experts[num_balanced_tokens:]
91 91 return mixed_experts
9292
93- @functools.cache
94 93 @staticmethod
94+ @functools.cache
95 95 def get_all_to_one_selection(
96 96 num_tokens, top_k, num_experts, balance_ratio, dtype, world_size, rank
97 97 ):
@@ -103,8 +103,8 @@ def get_all_to_one_selection(
103 103 imbalanced_experts, num_experts, balance_ratio, world_size, rank
104 104 )
105 105
106- @functools.cache
107 106 @staticmethod
107+ @functools.cache
108 108 def get_balanced_rank_imbalanced_expert_selection(
109 109 num_tokens, top_k, num_experts, balance_ratio, dtype, world_size, rank
110 110 ):
0 commit comments