Skip to content

Commit 5be08ac

Browse files
committed
up
1 parent f2ab39b commit 5be08ac

File tree

1 file changed

+3
-0
lines changed

1 file changed

+3
-0
lines changed

fastdeploy/engine/common_engine.py

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -436,6 +436,9 @@ def _insert_prefilled_requests(self, request_outputs: List[RequestOutput]):
436 | 436 |
437 | 437 | cur_req.prompt_token_ids[0] = req_out.outputs.token_ids[0]
438 | 438 | cur_req.num_cached_tokens = req_out.num_cached_tokens
    | 439 | + req_out.metrics.decode_recv_req_time = cur_req.metrics.decode_recv_req_time
    | 440 | + req_out.metrics.decode_preallocat_req_time = cur_req.metrics.decode_preallocat_req_time
    | 441 | + cur_req.metrics = req_out.metrics
439 | 442 | cur_req.metrics.decode_inference_start_time = time.time()
440 | 443 | if self.cfg.speculative_config.method in ["mtp"] and self.cfg.scheduler_config.splitwise_role == "decode":
441 | 444 | cur_req.draft_token_ids = copy.deepcopy(req_out.outputs.draft_token_ids)

0 commit comments

Comments (0)