File tree Expand file tree Collapse file tree 2 files changed +8
-6
lines changed
lightllm/server/router/model_infer/mode_backend/continues_batch/pd_mode/prefill_node_impl Expand file tree Collapse file tree 2 files changed +8
-6
lines changed Original file line number Diff line number Diff line change @@ -49,17 +49,17 @@ def init_custom(self):
49
49
return
50
50
51
51
def _pre_handle_finished_reqs (self , finished_reqs ):
52
- self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (run_reqs = finished_reqs )
52
+ self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (finished_reqs = finished_reqs )
53
53
return
54
54
55
- def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs : List [InferReq ]):
55
+ def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , finished_reqs : List [InferReq ]):
56
56
# 提前在radix cache中回收相关的信息,并添加引用进行锁定,方便传输进程传输kv。
57
57
if self .is_master_in_dp :
58
58
logger .info ("prefill_req_handle_and_frozen_tokens" )
59
59
60
60
g_infer_state_lock .acquire ()
61
61
try :
62
- for req in run_reqs :
62
+ for req in finished_reqs :
63
63
64
64
# 区分abort 和 正常结束的请求,正常结束的请求才发起kv传输任务。
65
65
if not req .finish_status .is_finished ():
Original file line number Diff line number Diff line change @@ -19,9 +19,11 @@ def init_custom(self):
19
19
return
20
20
21
21
def _pre_handle_finished_reqs (self , finished_reqs ):
22
- self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (run_reqs = finished_reqs )
22
+ self ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (finished_reqs = finished_reqs )
23
23
return
24
24
25
- def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs : List [InferReq ]):
26
- DPChunkedForPrefillNode ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , run_reqs = run_reqs )
25
+ def _prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (self , finished_reqs : List [InferReq ]):
26
+ ChunckedPrefillForPrefillNode ._prefill_req_frozen_tokens_and_put_to_kvmove_taskqueue (
27
+ self , finished_reqs = finished_reqs
28
+ )
27
29
return
You can’t perform that action at this time.
0 commit comments