import contextlib
import functools
import gc
from typing import Callable, TypeVar

import pytest
import ray
import torch
from typing_extensions import ParamSpec

from vllm.distributed import (destroy_distributed_environment,
                              destroy_model_parallel)
from vllm.model_executor.model_loader.tensorizer import TensorizerConfig


@pytest.fixture(autouse=True)
def cleanup():
    # Tear down model-parallel and distributed state, shut down Ray, and
    # release cached GPU memory so each test starts from a clean slate.
    destroy_model_parallel()
    destroy_distributed_environment()
    with contextlib.suppress(AssertionError):
        torch.distributed.destroy_process_group()
    ray.shutdown()
    gc.collect()
    torch.cuda.empty_cache()


_P = ParamSpec("_P")
_R = TypeVar("_R")


def retry_until_skip(n: int):
    """Retry a test up to ``n`` times on AssertionError, then skip it."""

    def decorator_retry(func: Callable[_P, _R]) -> Callable[_P, _R]:

        @functools.wraps(func)
        def wrapper_retry(*args: _P.args, **kwargs: _P.kwargs) -> _R:
            for i in range(n):
                try:
                    return func(*args, **kwargs)
                except AssertionError:
                    # Free GPU memory before retrying; skip the test once
                    # the final attempt has failed.
                    gc.collect()
                    torch.cuda.empty_cache()
                    if i == n - 1:
                        pytest.skip(f"Skipping test after {n} attempts.")

            raise AssertionError("Code should not be reached")

        return wrapper_retry

    return decorator_retry


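# A minimal usage sketch (hypothetical test name and helper, not part of this
# conftest): a flaky, memory-sensitive test can be retried a few times and
# skipped if it never passes.
#
#     @retry_until_skip(3)
#     def test_model_loads_without_oom():
#         assert load_and_check_model()  # hypothetical helper

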
@pytest.fixture(autouse=True)
def tensorizer_config():
    config = TensorizerConfig(tensorizer_uri="vllm")
    return config
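# A minimal usage sketch (hypothetical test, not part of this conftest): the
# autouse fixture above makes the config available by name, assuming
# TensorizerConfig exposes the tensorizer_uri it was constructed with.
#
#     def test_tensorizer_uri(tensorizer_config):
#         assert tensorizer_config.tensorizer_uri == "vllm"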