7070 - VLLM_ATTENTION_BACKEND=XFORMERS pytest -v -s basic_correctness/test_chunked_prefill.py
7171 - VLLM_ATTENTION_BACKEND=FLASH_ATTN pytest -v -s basic_correctness/test_chunked_prefill.py
7272 - VLLM_TEST_ENABLE_ARTIFICIAL_PREEMPT=1 pytest -v -s basic_correctness/test_preemption.py
73-
73+
7474- label : Core Test # 10min
7575 mirror_hardwares : [amd]
7676 fast_check : true
@@ -90,8 +90,11 @@ steps:
9090 commands :
9191 - pip install -e ./plugins/vllm_add_dummy_model
9292 - pip install git+https://github.com/EleutherAI/lm-evaluation-harness.git@a4987bba6e9e9b3f22bd3a6c1ecf0abd04fd5622#egg=lm_eval[api]
93- - pytest -v -s entrypoints/llm --ignore=entrypoints/llm/test_lazy_outlines.py
93+ - pytest -v -s entrypoints/llm --ignore=entrypoints/llm/test_lazy_outlines.py --ignore=entrypoints/llm/test_generate.py --ignore=entrypoints/llm/test_generate_multiple_loras.py --ignore=entrypoints/llm/test_guided_generate.py
9494 - pytest -v -s entrypoints/llm/test_lazy_outlines.py # it needs a clean process
95+ - pytest -v -s entrypoints/llm/test_generate.py # it needs a clean process
96+ - pytest -v -s entrypoints/llm/test_generate_multiple_loras.py # it needs a clean process
97+ - pytest -v -s entrypoints/llm/test_guided_generate.py # it needs a clean process
9598 - pytest -v -s entrypoints/openai
9699 - pytest -v -s entrypoints/test_chat_utils.py
97100 - pytest -v -s entrypoints/offline_mode # Needs to avoid interference with other tests
@@ -207,6 +210,21 @@ steps:
207210 command : pytest -v -s lora --shard-id=$$BUILDKITE_PARALLEL_JOB --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT --ignore=lora/test_long_context.py
208211 parallelism : 4
209212
213+ - label : "PyTorch Fullgraph Smoke Test"
214+ fast_check : true
215+ source_file_dependencies :
216+ - vllm/
217+ - tests/compile
218+ commands :
219+ - pytest -v -s compile/test_full_graph_smoke.py
220+
221+ - label : "PyTorch Fullgraph Test"
222+ source_file_dependencies :
223+ - vllm/
224+ - tests/compile
225+ commands :
226+ - pytest -v -s compile/test_full_graph.py
227+
210228- label : Kernels Test %N # 30min each
211229 mirror_hardwares : [amd]
212230 source_file_dependencies :
@@ -352,7 +370,7 @@ steps:
352370 - tests/distributed/
353371 - vllm/compilation
354372 commands :
355- - pytest -v -s ./compile/test_full_graph.py
373+ - pytest -v -s ./compile/test_full_graph_multi_gpu.py
356374 - pytest -v -s ./compile/test_wrapper.py
357375 - VLLM_TEST_SAME_HOST=1 torchrun --nproc-per-node=4 distributed/test_same_node.py | grep -q 'Same node test passed'
358376 - TARGET_TEST_SUITE=L4 pytest basic_correctness/ -v -s -m distributed_2_gpus
0 commit comments