2 files changed: +16 -3 lines changed
Original file line number Diff line number Diff line change
1818 MedusaDecodingConfig )
1919from tensorrt_llm .quantization import QuantAlgo
2020
21- from ..conftest import (llm_models_root , parametrize_with_ids , skip_no_nvls ,
22- skip_post_blackwell , skip_pre_ada , skip_pre_blackwell ,
23- skip_pre_hopper )
21+ from ..conftest import (get_sm_version , llm_models_root , parametrize_with_ids ,
22+ skip_no_nvls , skip_post_blackwell , skip_pre_ada ,
23+ skip_pre_blackwell , skip_pre_hopper )
2424from .accuracy_core import (MMLU , CliFlowAccuracyTestHarness , CnnDailymail ,
2525 Humaneval , PassKeyRetrieval64k ,
2626 PassKeyRetrieval128k , SlimPajama6B , ZeroScrolls )
2727
28+ # Skip every TRT-flow test case in this module on post-Blackwell-Ultra GPUs (SM version >= 103).
29+ if get_sm_version () >= 103 :
30+ pytest .skip (
31+ "TRT workflow tests are not supported on post Blackwell-Ultra architecture" ,
32+ allow_module_level = True )
33+
2834
2935class TestGpt2 (CliFlowAccuracyTestHarness ):
3036 MODEL_NAME = "gpt2"
Original file line number Diff line number Diff line change @@ -391,3 +391,10 @@ accuracy/test_llm_api_pytorch.py::TestQwen3_8B::test_bf16[multi_gpus_no_cache] S
391391triton_server/test_triton.py::test_llava[llava] SKIP (https://nvbugs/5547414)
392392disaggregated/test_workers.py::test_workers_kv_cache_aware_router[TinyLlama-1.1B-Chat-v1.0] SKIP (https://nvbugs/5607238)
393393unittest/executor/test_rpc_proxy.py SKIP (https://nvbugs/5605741)
394+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGemma3_1BInstruct::test_auto_dtype SKIP (https://nvbugs/5569696)
395+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[tp2-trtllm-auto] SKIP (https://nvbugs/5569719)
396+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[tp2-trtllm-fp8] SKIP (https://nvbugs/5569719)
397+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[ep2-trtllm-auto] SKIP (https://nvbugs/5569719)
398+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[ep2-trtllm-fp8] SKIP (https://nvbugs/5569719)
399+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[dp2-trtllm-auto] SKIP (https://nvbugs/5569719)
400+ full:RTX/accuracy/test_llm_api_pytorch.py::TestGPTOSS::test_w4_2gpus[dp2-trtllm-fp8] SKIP (https://nvbugs/5569719)
You can’t perform that action at this time.
0 commit comments