File tree Expand file tree Collapse file tree 3 files changed +4
-0
lines changed
tests/integration/test_lists/qa Expand file tree Collapse file tree 3 files changed +4
-0
lines changed Original file line number Diff line number Diff line change @@ -622,6 +622,7 @@ test_e2e.py::test_qwen_e2e_cpprunner_large_new_tokens[DeepSeek-R1-Distill-Qwen-1
622622test_e2e.py::test_openai_multi_chat_example
623623test_e2e.py::test_openai_consistent_chat
624624test_e2e.py::test_openai_chat_guided_decoding
625+ test_e2e.py::test_openai_chat_harmony
625626test_e2e.py::test_trtllm_benchmark_serving[llama-3.1-model/Meta-Llama-3.1-8B]
626627test_e2e.py::test_trtllm_benchmark_serving[gpt_oss/gpt-oss-20b]
627628test_e2e.py::test_trtllm_multimodal_benchmark_serving
@@ -745,6 +746,7 @@ disaggregated/test_disaggregated_single_gpu.py::test_disaggregated_simple_qwen3[
745746disaggregated/test_disaggregated_single_gpu.py::test_disaggregated_simple_qwen3[True-True-Qwen3-8B-FP8]
746747disaggregated/test_disaggregated.py::test_disaggregated_ctxtp2pp2_gentp2pp2[TinyLlama-1.1B-Chat-v1.0]
747748disaggregated/test_disaggregated.py::test_disaggregated_ctxpp4_genpp4[TinyLlama-1.1B-Chat-v1.0]
749+ disaggregated/test_disaggregated.py::test_disaggregated_kv_cache_time_output[TinyLlama-1.1B-Chat-v1.0]
748750disaggregated/test_workers.py::test_workers_conditional_disaggregation[TinyLlama-1.1B-Chat-v1.0]
749751disaggregated/test_workers.py::test_workers_kv_cache_events[TinyLlama-1.1B-Chat-v1.0]
750752disaggregated/test_workers.py::test_workers_kv_cache_aware_router[TinyLlama-1.1B-Chat-v1.0]
Original file line number Diff line number Diff line change @@ -207,6 +207,7 @@ disaggregated/test_workers.py::test_workers_conditional_disaggregation[TinyLlama
207207disaggregated/test_workers.py::test_workers_kv_cache_aware_router_eviction[TinyLlama-1.1B-Chat-v1.0]
208208disaggregated/test_workers.py::test_workers_kv_cache_aware_router[TinyLlama-1.1B-Chat-v1.0]
209209disaggregated/test_workers.py::test_workers_kv_cache_events[TinyLlama-1.1B-Chat-v1.0]
210+ test_e2e.py::test_openai_chat_harmony
210211test_e2e.py::test_openai_consistent_chat
211212test_e2e.py::test_openai_multi_chat_example
212213test_e2e.py::test_ptp_quickstart
Original file line number Diff line number Diff line change @@ -173,6 +173,7 @@ accuracy/test_llm_api_pytorch.py::TestQwQ_32B::test_auto_dtype_tp4
173173accuracy/test_llm_api_pytorch.py::TestCodestral_22B_V01::test_auto_dtype
174174accuracy/test_llm_api_pytorch.py::TestKimiK2::test_fp8_blockscale[latency]
175175
176+ test_e2e.py::test_openai_chat_harmony
176177test_e2e.py::test_ptp_quickstart_advanced_8gpus[Nemotron-Ultra-253B-nemotron-nas/Llama-3_1-Nemotron-Ultra-253B-v1]
177178test_e2e.py::test_ptp_quickstart_advanced[Nemotron4_4B-BF16-nemotron/Minitron-4B-Base]
178179test_e2e.py::test_ptp_quickstart_advanced[Nemotron-H-8B-Nemotron-H-8B-Base-8K]
You can’t perform that action at this time.
0 commit comments