Skip to content

Commit c408a6e

Browse files
authored
[vllm, sglang, rollout] fix: Fix a mistake when running run_qwen3_vl-30b-megatron.sh with latest verl and vllm0.12 (#4810)
1 parent 200bc6d commit c408a6e

File tree

3 files changed

+26
-4
lines changed

3 files changed

+26
-4
lines changed

verl/workers/rollout/sglang_rollout/async_sglang_server.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -44,7 +44,12 @@
4444
from verl.workers.config import HFModelConfig, RolloutConfig
4545
from verl.workers.rollout.replica import RolloutMode, RolloutReplica, TokenOutput
4646
from verl.workers.rollout.sglang_rollout.sglang_rollout import ServerAdapter, _set_envs_and_config
47-
from verl.workers.rollout.utils import get_free_port, is_valid_ipv6_address, run_unvicorn
47+
from verl.workers.rollout.utils import (
48+
get_free_port,
49+
get_max_position_embeddings,
50+
is_valid_ipv6_address,
51+
run_unvicorn,
52+
)
4853

4954
logger = logging.getLogger(__file__)
5055
logger.setLevel(logging.INFO)
@@ -83,7 +88,7 @@ def __init__(
8388

8489
self.config: RolloutConfig = omega_conf_to_dataclass(config)
8590
self.model_config: HFModelConfig = omega_conf_to_dataclass(model_config, dataclass_type=HFModelConfig)
86-
self.config.max_model_len = self.model_config.hf_config.max_position_embeddings
91+
self.config.max_model_len = get_max_position_embeddings(self.model_config.hf_config)
8792
self.rollout_mode = rollout_mode
8893
self.workers = workers
8994

verl/workers/rollout/utils.py

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -23,6 +23,18 @@
2323
logger = logging.getLogger(__file__)
2424

2525

26+
def get_max_position_embeddings(hf_config) -> int:
    """Return the maximum position-embedding length declared by ``hf_config``.

    The top-level ``max_position_embeddings`` attribute is used when it is
    present and not ``None``. Otherwise the same attribute is read from
    ``hf_config.text_config``, if that nested config exists.

    Args:
        hf_config: Config object that is inspected via ``getattr``.

    Returns:
        The located value converted with ``int()``.

    Raises:
        ValueError: If neither location yields a non-``None`` value.
    """
    top_level = getattr(hf_config, "max_position_embeddings", None)
    if top_level is not None:
        return int(top_level)

    # Only consult the nested text config once the top-level lookup has failed.
    nested_config = getattr(hf_config, "text_config", None)
    nested_value = (
        None
        if nested_config is None
        else getattr(nested_config, "max_position_embeddings", None)
    )
    if nested_value is None:
        raise ValueError("max_position_embeddings not found in HFModelConfig!")
    return int(nested_value)
36+
37+
2638
def is_valid_ipv6_address(address: str) -> bool:
2739
try:
2840
ipaddress.IPv6Address(address)

verl/workers/rollout/vllm_rollout/vllm_async_server.py

Lines changed: 7 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,12 @@
4848
from verl.utils.vllm.vllm_fp8_utils import apply_vllm_fp8_patches
4949
from verl.workers.config import HFModelConfig, RolloutConfig
5050
from verl.workers.rollout.replica import RolloutMode, RolloutReplica, TokenOutput
51-
from verl.workers.rollout.utils import get_free_port, is_valid_ipv6_address, run_unvicorn
51+
from verl.workers.rollout.utils import (
52+
get_free_port,
53+
get_max_position_embeddings,
54+
is_valid_ipv6_address,
55+
run_unvicorn,
56+
)
5257
from verl.workers.rollout.vllm_rollout import vLLMAsyncRollout
5358
from verl.workers.rollout.vllm_rollout.utils import (
5459
VLLM_LORA_INT_ID,
@@ -195,7 +200,7 @@ def __init__(
195200

196201
self.config: RolloutConfig = omega_conf_to_dataclass(config)
197202
self.model_config: HFModelConfig = omega_conf_to_dataclass(model_config, dataclass_type=HFModelConfig)
198-
self.config.max_model_len = self.model_config.hf_config.max_position_embeddings
203+
self.config.max_model_len = get_max_position_embeddings(self.model_config.hf_config)
199204
self.rollout_mode = rollout_mode
200205
self.workers = workers
201206

0 commit comments

Comments
 (0)