Skip to content

Commit c0b73ba

Browse files
committed
support pipeline parallel in V1 engine
Signed-off-by: weiguihua2 <weiguihua2@huawei.com>
1 parent d2f5861 commit c0b73ba

File tree

1 file changed

+4
-8
lines changed

1 file changed

+4
-8
lines changed

tests/e2e/multicard/test_pipeline_parallel.py

Lines changed: 4 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -34,11 +34,7 @@
3434
@pytest.mark.parametrize("model", MODELS)
3535
@pytest.mark.parametrize("tp_size", TENSOR_PARALLELS)
3636
@pytest.mark.parametrize("pp_size", PIPELINE_PARALLELS)
37-
@pytest.mark.parametrize("max_tokens", [64])
38-
@pytest.mark.parametrize("temperature", [0.0])
39-
@pytest.mark.parametrize("ignore_eos", [True])
40-
def test_models(model: str, tp_size: int, pp_size: int, max_tokens: int, temperature: int,
41-
ignore_eos: bool) -> None:
37+
def test_models(model: str, tp_size: int, pp_size: int) -> None:
4238
# Create an LLM.
4339
llm = LLM(
4440
model=model,
@@ -49,9 +45,9 @@ def test_models(model: str, tp_size: int, pp_size: int, max_tokens: int, tempera
4945
)
5046
# Prepare sampling_params
5147
sampling_params = SamplingParams(
52-
max_tokens=max_tokens,
53-
temperature=temperature,
54-
ignore_eos=ignore_eos,
48+
max_tokens=64,
49+
temperature=0,
50+
ignore_eos=True,
5551
)
5652

5753
# Generate texts from the prompts.

0 commit comments

Comments
 (0)