Skip to content

Commit 91d9e89

Browse files
hiworldwzj and wangzaijun authored
fix mem alloc (#627)
Co-authored-by: wangzaijun <[email protected]>
1 parent 01f8324 commit 91d9e89

File tree

2 files changed

+10
-3
lines changed

2 files changed

+10
-3
lines changed

lightllm/common/basemodel/basemodel.py

Lines changed: 9 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -71,8 +71,15 @@ def __init__(self, kvargs):
71 71           self._verify_must()
72 72           self._verify_params()
73 73           self._init_quant()
74    -         self._init_weights()
75    -         self._init_mem_manager()
   74 +
   75 +         # 更连续的显存分配可以有更好的性能
   76 +         if self.max_total_token_num is None:
   77 +             self._init_weights()
   78 +             self._init_mem_manager()
   79 +         else:
   80 +             self._init_mem_manager()
   81 +             self._init_weights()
   82 +
76 83           self._init_kv_move_buffer()
77 84           self._check_mem_size()
78 85           self._init_req_manager()

lightllm/server/router/model_infer/mode_backend/base_backend.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -85,7 +85,7 @@ def init_model(self, kvargs):
85 85               rank=self.tp_rank,
86 86               world_size=self.world_size,
87 87           )
88    -
   88 +
89 89           from lightllm.distributed import set_custom_reduce
90 90
91 91           set_custom_reduce()

0 commit comments

Comments
 (0)