2024-08-15 22:38:56 -07:00
|
|
|
import pytest
|
|
|
|
|
2024-10-10 12:39:36 -07:00
|
|
|
from vllm.compilation.levels import CompilationLevel
|
2024-08-15 22:38:56 -07:00
|
|
|
|
2024-10-10 12:39:36 -07:00
|
|
|
from ..utils import fork_new_process_for_each_test
|
2024-09-25 10:35:52 -04:00
|
|
|
from .utils import TEST_MODELS, check_full_graph_support
|
2024-09-14 09:46:04 -07:00
|
|
|
|
|
|
|
|
2024-09-25 10:35:52 -04:00
|
|
|
@pytest.mark.parametrize("model_info", TEST_MODELS)
@pytest.mark.parametrize(
    "optimization_level",
    [CompilationLevel.DYNAMO_ONCE, CompilationLevel.PIECEWISE],
)
@fork_new_process_for_each_test
def test_full_graph(model_info, optimization_level):
    """Run the full-graph support check for one model entry and level.

    Parametrized over every entry of ``TEST_MODELS`` and over the
    ``DYNAMO_ONCE`` and ``PIECEWISE`` compilation levels.

    Args:
        model_info: One entry of ``TEST_MODELS``; element 0 is passed as
            the first argument to ``check_full_graph_support`` and
            element 1 as the second.
        optimization_level: The ``CompilationLevel`` value forwarded as
            the third argument.
    """
    # Index explicitly (rather than unpack) so entries longer than two
    # elements are still accepted.
    target_model, extra_kwargs = model_info[0], model_info[1]
    check_full_graph_support(
        target_model,
        extra_kwargs,
        optimization_level,
        tp_size=1,
    )
|