File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -68,9 +68,6 @@ def normal_or_p_d_start(args):
6868
6969 set_unique_server_name (args )
7070
71- if not args .disable_shm_warning :
72- check_recommended_shm_size (args )
73-
7471 if args .enable_mps :
7572 from lightllm .utils .device_utils import enable_mps
7673
@@ -108,6 +105,9 @@ def normal_or_p_d_start(args):
108105 if args .enable_multimodal :
109106 args .multi_modal_cache_shm_id = uuid .uuid1 ().int % 123456789
110107
108+ if not args .disable_shm_warning :
109+ check_recommended_shm_size (args )
110+
111111 assert args .zmq_mode in ["tcp://" , "ipc:///tmp/" ]
112112 # 确保单机上多实例不冲突
113113 if args .zmq_mode == "ipc:///tmp/" :
Original file line number Diff line number Diff line change @@ -161,6 +161,3 @@ class StartArgs:
161161 metric_port : int = field (default = None )
162162 multinode_httpmanager_port : int = field (default = 12345 )
163163 multi_level_kv_cache_port : int = field (default = None )
164- # multi_modal
165- enable_multimodal : bool = field (default = False )
166- enable_multimodal_audio : bool = field (default = False )
Original file line number Diff line number Diff line change @@ -444,7 +444,7 @@ async def _encode(
444444 len (multimodal_params .images + multimodal_params .audios ) <= self .args .cache_capacity
445445 ), "too many multimodal items!"
446446 if multimodal_params .audios :
447- assert self .args .enable_multimodal_audio , "audio multimodal not enabled"
447+ assert not self .args .disable_audio , "audio multimodal not enabled"
448448 await self ._alloc_multimodal_resources (multimodal_params , sampling_params )
449449 prompt_ids = self .tokenizer .encode (
450450 prompt , multimodal_params , add_special_tokens = sampling_params .add_special_tokens
Original file line number Diff line number Diff line change 11# first
2- LOADWORKER=18 CUDA_VISIBLE_DEVICES=6,7 python -m lightllm.server.api_server --model_dir /mtc/models/Qwen3-VL-8B-Instruct --tp 2 --port 8089 --enable_multimodal_visual
2+ LOADWORKER=18 CUDA_VISIBLE_DEVICES=6,7 python -m lightllm.server.api_server --model_dir /mtc/models/Qwen3-VL-8B-Instruct --tp 2 --port 8089
33
44# second
55python test_vlm_models.py
You can’t perform that action at this time.
0 commit comments