Skip to content

Commit 98ac0cb

Browse files
authored
[Bugfix] Use ReplicatedLinear for SequenceClassification head (vllm-project#23836)
Signed-off-by: Isotr0py <mozf@mail2.sysu.edu.cn>
1 parent c8b3b29 commit 98ac0cb

File tree

2 files changed

+4
-8
lines changed

2 files changed

+4
-8
lines changed

tests/models/language/pooling/test_qwen3_reranker.py

Lines changed: 2 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -96,8 +96,5 @@ def test_rerank_models_mteb_tp(vllm_runner,
9696
"tensor_parallel_size": 2,
9797
}
9898

99-
mteb_test_rerank_models(Qwen3RerankerHfRunner,
100-
vllm_runner,
101-
model_info,
102-
vllm_extra_kwargs,
103-
atol=1.2e-2)
99+
mteb_test_rerank_models(Qwen3RerankerHfRunner, vllm_runner, model_info,
100+
vllm_extra_kwargs)

vllm/model_executor/models/adapters.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -248,7 +248,7 @@ def as_seq_cls_model(cls: _T) -> _T:
248248
return cls
249249

250250
# Lazy import
251-
from vllm.model_executor.layers.linear import RowParallelLinear
251+
from vllm.model_executor.layers.linear import ReplicatedLinear
252252
from vllm.model_executor.layers.pooler import (ClassifierPooler,
253253
DispatchPooler, Pooler,
254254
PoolingMethod, PoolingType)
@@ -264,10 +264,9 @@ def _init_pooler(self, vllm_config: "VllmConfig", prefix: str = ""):
264264
config = vllm_config.model_config.hf_config
265265
quant_config = vllm_config.quant_config
266266

267-
self.score = RowParallelLinear(
267+
self.score = ReplicatedLinear(
268268
config.hidden_size,
269269
config.num_labels,
270-
input_is_parallel=False,
271270
bias=False,
272271
params_dtype=torch.float32,
273272
quant_config=quant_config,

0 commit comments

Comments
 (0)