@@ -812,6 +812,10 @@ steps:
812812 - vllm/model_executor/layers/quantization/utils/flashinfer_utils.py
813813 - vllm/v1/attention/backends/flashinfer.py
814814 - vllm/compilation/
815+ # changes to these layer implementations can affect fusion pattern matching in vllm/compilation/
816+ - vllm/model_executor/layers/layernorm.py
817+ - vllm/model_executor/layers/activation.py
818+ - vllm/model_executor/layers/quantization/input_quant_fp8.py
815819 commands :
816820 - nvidia-smi
817821 - python3 examples/offline_inference/basic/chat.py
@@ -833,7 +837,6 @@ steps:
833837 - pytest -v -s tests/kernels/moe/test_nvfp4_moe.py
834838 - pytest -v -s tests/kernels/moe/test_ocp_mx_moe.py
835839 # Fusion
836- - pytest -v -s tests/compile/test_fusion_all_reduce.py
837840 - pytest -v -s tests/compile/test_fusion_attn.py::test_attention_quant_pattern
838841 - pytest -v -s tests/kernels/moe/test_flashinfer.py
839842 - pytest -v -s tests/compile/test_silu_mul_quant_fusion.py
@@ -1090,7 +1093,7 @@ steps:
10901093 - pytest -s -v test_lm_eval_correctness.py --config-list-file=configs/models-large.txt --tp-size=4
10911094
10921095 ##### H200 test #####
1093- - label : Distrubted Tests (H200) # optional
1096+ - label : Distributed Tests (H200) # optional
10941097 gpu : h200
10951098 optional : true
10961099 working_dir : " /vllm-workspace/"
@@ -1110,6 +1113,7 @@ steps:
11101113 commands :
11111114 - pytest -v -s tests/distributed/test_context_parallel.py
11121115 - pytest -v -s tests/distributed/test_nccl_symm_mem_allreduce.py
1116+ - pytest -v -s tests/compile/test_fusion_all_reduce.py
11131117 - pytest -v -s tests/compile/test_fusions_e2e.py::test_tp2_attn_quant_allreduce_rmsnorm
11141118
11151119 ##### RL Integration Tests #####
0 commit comments