
Signed-off-by: sibi <85477603+t-sibiraj@users.noreply.github.com> Signed-off-by: Aaron Pham <contact@aarnphm.xyz> Co-authored-by: Cyrus Leung <cyrus.tl.leung@gmail.com> Co-authored-by: Aaron Pham <contact@aarnphm.xyz>
67 lines
2.2 KiB
Python
67 lines
2.2 KiB
Python
# SPDX-License-Identifier: Apache-2.0
|
|
|
|
import os
|
|
|
|
import pytest
|
|
|
|
from vllm.distributed.utils import get_pp_indices
|
|
|
|
|
|
def test_custom_layer_partition(monkeypatch: pytest.MonkeyPatch):
|
|
|
|
with monkeypatch.context() as m:
|
|
|
|
def _verify(partition_str, num_layers, pp_size, goldens):
|
|
bak = os.environ.get("VLLM_PP_LAYER_PARTITION", None)
|
|
m.setenv("VLLM_PP_LAYER_PARTITION", partition_str)
|
|
for pp_rank, golden in enumerate(goldens):
|
|
assert get_pp_indices(num_layers, pp_rank, pp_size) == golden
|
|
if bak is not None:
|
|
m.setenv("VLLM_PP_LAYER_PARTITION", bak)
|
|
|
|
# Even partition
|
|
_verify("5,5,5,5", 20, 4, [(0, 5), (5, 10), (10, 15), (15, 20)])
|
|
# Balanced partition
|
|
_verify("4,6,6,4", 20, 4, [(0, 4), (4, 10), (10, 16), (16, 20)])
|
|
# Put reminder somewhere
|
|
_verify("5,6,5,6", 22, 4, [(0, 5), (5, 11), (11, 16), (16, 22)])
|
|
# Invalid partition strings
|
|
with pytest.raises(ValueError):
|
|
_verify("5,5,5,5,", 20, 4, [(0, 5), (5, 10), (10, 15), (15, 20)])
|
|
with pytest.raises(ValueError):
|
|
_verify("5,5,5,a", 20, 4, [(0, 5), (5, 10), (10, 15), (15, 20)])
|
|
# Wrong number of partitions
|
|
with pytest.raises(ValueError):
|
|
_verify("5,5,5", 20, 4, [(0, 5), (5, 10), (10, 15), (15, 20)])
|
|
# Wrong number of layers
|
|
with pytest.raises(ValueError):
|
|
_verify("5,5,5,5", 21, 4, [(0, 5), (5, 10), (10, 15), (15, 20)])
|
|
|
|
|
|
@pytest.mark.parametrize(
|
|
"num_hidden_layers,pp_size,pp_rank,indices",
|
|
[
|
|
# pp_size 2
|
|
(2, 2, 0, (0, 1)),
|
|
(2, 2, 1, (1, 2)),
|
|
(3, 2, 0, (0, 2)),
|
|
(3, 2, 1, (2, 3)),
|
|
# pp_size 3
|
|
(3, 3, 0, (0, 1)),
|
|
(3, 3, 1, (1, 2)),
|
|
(3, 3, 2, (2, 3)),
|
|
(4, 3, 0, (0, 1)),
|
|
(4, 3, 1, (1, 3)),
|
|
(4, 3, 2, (3, 4)),
|
|
(5, 3, 0, (0, 2)),
|
|
(5, 3, 1, (2, 4)),
|
|
(5, 3, 2, (4, 5)),
|
|
])
|
|
def test_uneven_auto_partition(
|
|
num_hidden_layers: int,
|
|
pp_size: int,
|
|
pp_rank: int,
|
|
indices: tuple[int, int],
|
|
):
|
|
assert indices == get_pp_indices(num_hidden_layers, pp_rank, pp_size)
|