Skip to content

Commit e186bed

Browse files
committed
fix
1 parent 91a5e15 commit e186bed

File tree

2 files changed

+8
-6
lines changed

2 files changed

+8
-6
lines changed

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl/prefill_impl.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -49,17 +49,17 @@ def init_custom(self):
49 49
return
50 50

51 51
def _pre_handle_finished_reqs(self, finished_reqs):
52-
self._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(run_reqs=finished_reqs)
52+
self._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(finished_reqs=finished_reqs)
53 53
return
54 54

55-
def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, run_reqs: List[InferReq]):
55+
def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, finished_reqs: List[InferReq]):
56 56
# 提前在radix cache中回收相关的信息,并添加引用进行锁定,方便传输进程传输kv。
57 57
if self.is_master_in_dp:
58 58
logger.info("prefill_req_handle_and_frozen_tokens")
59 59

60 60
g_infer_state_lock.acquire()
61 61
try:
62-
for req in run_reqs:
62+
for req in finished_reqs:
63 63

64 64
# 区分abort 和 正常结束的请求,正常结束的请求才发起kv传输任务。
65 65
if not req.finish_status.is_finished():

lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl/prefill_impl_for_dp.py

Lines changed: 5 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -19,9 +19,11 @@ def init_custom(self):
19 19
return
20 20

21 21
def _pre_handle_finished_reqs(self, finished_reqs):
22-
self._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(run_reqs=finished_reqs)
22+
self._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(finished_reqs=finished_reqs)
23 23
return
24 24

25-
def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, run_reqs: List[InferReq]):
26-
DPChunkedForPrefillNode._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, run_reqs=run_reqs)
25+
def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(self, finished_reqs: List[InferReq]):
26+
ChunckedPrefillForPrefillNode._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue(
27+
self, finished_reqs=finished_reqs
28+
)
27 29
return

0 commit comments

Comments
 (0)