Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 10 additions & 6 deletions pyproject.toml
Original file line number Diff line number Diff line change
Expand Up @@ -137,19 +137,23 @@ asyncio_default_fixture_loop_scope = "function"

# --8<-- [start:test-markers-definition]
markers = [
"skip_global_cleanup",
"e2e: Tests using end-to-end engine spin-up",
"basic: Basic correctness tests",
"cb: Continuous batching tests",
"cpu: Tests using CPU (i.e. eager) backend",
"compat: backward compatibility tests",
"spyre: Tests using Spyre hardware backend",
"compiler_support_32k: Tests for 32k compiler support",
"cpu: Tests using CPU (i.e. eager) backend",
"decoder: Tests for decoder models",
"e2e: Tests using end-to-end engine spin-up",
"embedding: Tests for embedding models",
"quantized: Tests for quantized models",
"full_model: Tests that use full-sized granite models",
"multi: Tests that require >1 cards",
"other_e2e: ??? Tests for sampling params that take a long time",
"precompilation: Tests the handling of precompiled model catalogs",
"quantized: Tests for quantized models",
"scoring: Tests for scoring and reranking models",
"spyre: Tests using Spyre hardware backend",
"utils: Tests for utility functions",
"worker: Tests for worker logic",
"worker: Tests for worker logic"
]
# --8<-- [end:test-markers-definition]

Expand Down
18 changes: 0 additions & 18 deletions tests/conftest.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,6 @@
from spyre_util import (get_spyre_backend_list, get_spyre_model_list,
skip_unsupported_tp_size)
from vllm.connections import global_http_connection
from vllm.distributed import cleanup_dist_env_and_memory

from vllm_spyre import envs

Expand Down Expand Up @@ -176,23 +175,6 @@ def init_test_http_connection():
global_http_connection.reuse_client = False


@pytest.fixture()
def should_do_global_cleanup_after_test(request) -> bool:
    """Decide whether the global cleanup should run once the test is done.

    Subdirectories may override this fixture to opt out of the global
    cleanup. Skipping it can give a ~10x speedup for non-GPU unit tests,
    because those tests then never need to initialize torch.

    Returns:
        ``False`` when the closest ``skip_global_cleanup`` marker on the
        requesting test node is truthy, ``True`` otherwise.
    """
    skip_marker = request.node.get_closest_marker("skip_global_cleanup")
    return not skip_marker


@pytest.fixture(autouse=True)
def cleanup_fixture(should_do_global_cleanup_after_test: bool):
    """Run the global cleanup after each test unless it has been disabled.

    The fixture is autouse, so it wraps every test: control is handed to
    the test at the ``yield`` and the teardown below runs afterwards.
    """
    yield
    # Teardown phase: bail out early when cleanup was opted out of.
    if not should_do_global_cleanup_after_test:
        return
    cleanup_dist_env_and_memory()


@pytest.fixture(autouse=True)
def dynamo_reset():
yield
Expand Down
Loading