Skip to content

Commit 11b94fe

Browse files
authored
test: skip disaggregated tests on arm (#5070)
Signed-off-by: xinhe-nv <[email protected]>
1 parent a90dd57 commit 11b94fe

File tree

4 files changed

+16
-6
lines changed

4 files changed

+16
-6
lines changed

tests/integration/defs/accuracy/test_disaggregated_serving.py

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -174,6 +174,7 @@ def generate_async(prompt: str,
174174
disaggregated_server.wait()
175175

176176

177+
@pytest.mark.timeout(3600)
177178
class TestLlama3_1_8BInstruct(LlmapiAccuracyTestHarness):
178179
MODEL_NAME = "meta-llama/Llama-3.1-8B-Instruct"
179180
MODEL_PATH = f"{llm_models_root()}/llama-3.1-model/Llama-3.1-8B-Instruct"
@@ -208,11 +209,12 @@ def test_auto_dtype(self, disable_overlap_scheduler):
208209
task.evaluate(llm)
209210

210211

212+
@pytest.mark.timeout(3600)
213+
@pytest.mark.skip_less_device_memory(140000)
211214
class TestLlama4ScoutInstruct(LlmapiAccuracyTestHarness):
212215
MODEL_NAME = "meta-llama/Llama-4-Scout-17B-16E-Instruct"
213216
MODEL_PATH = f"{llm_models_root()}/llama4-models/Llama-4-Scout-17B-16E-Instruct"
214217

215-
@pytest.mark.skip_device_not_contain(["H200"])
216218
@pytest.mark.parametrize("overlap_scheduler", [False, True])
217219
def test_auto_dtype(self, overlap_scheduler):
218220
ctx_server_config = {"disable_overlap_scheduler": True}
@@ -241,6 +243,7 @@ def test_auto_dtype(self, overlap_scheduler):
241243
task.evaluate(llm)
242244

243245

246+
@pytest.mark.timeout(3600)
244247
class TestDeepSeekV3Lite(LlmapiAccuracyTestHarness):
245248
MODEL_NAME = "deepseek-ai/DeepSeek-V3-Lite"
246249
MODEL_PATH = f"{llm_models_root()}/DeepSeek-V3-Lite/bf16"

tests/integration/defs/conftest.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -16,6 +16,7 @@
1616

1717
import datetime
1818
import os
19+
import platform
1920
import re
2021
import shutil
2122
import subprocess as sp
@@ -283,7 +284,6 @@ def gemma_example_root(llm_root, llm_venv):
283284
# and caused pipeline to fail. We manually install gemma dependency as a WAR.
284285
llm_venv.run_cmd(["-m", "pip", "install", "safetensors~=0.4.1", "nltk"])
285286
# Install Jax because it breaks dependency
286-
import platform
287287
google_extension = [
288288
"-f",
289289
"https://storage.googleapis.com/jax-releases/jax_cuda_releases.html"
@@ -1722,8 +1722,6 @@ def qcache_dir(llm_venv, llm_root):
17221722

17231723
quantization_root = os.path.join(llm_root, "examples", "quantization")
17241724

1725-
import platform
1726-
17271725
# Fix the issue that the requirements.txt is not available on aarch64.
17281726
if "aarch64" not in platform.machine() and get_sm_version() >= 89:
17291727
llm_venv.run_cmd([
@@ -1874,7 +1872,11 @@ def check_device_contain(keyword_list):
18741872
reason="This test is only supported in Hopper architecture")
18751873

18761874
skip_no_sm120 = pytest.mark.skipif(get_sm_version() != 120,
1877-
reason="This test is for Blackwell SM120")
1875+
reason="This test is for SM120")
1876+
1877+
skip_arm = pytest.mark.skipif(
1878+
"aarch64" in platform.machine(),
1879+
reason="This test is not supported on ARM architecture")
18781880

18791881

18801882
def skip_fp8_pre_ada(use_fp8):

tests/integration/defs/disaggregated/test_disaggregated.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@
1717
import subprocess
1818

1919
import pytest
20-
from defs.conftest import skip_no_hopper
20+
from defs.conftest import skip_arm, skip_no_hopper
2121
from defs.trt_test_alternative import check_call, popen
2222

2323
from tensorrt_llm.logger import logger
@@ -528,6 +528,7 @@ def test_disaggregated_deepseek_v3_lite_fp8_tp1_single_gpu_mtp(
528528

529529

530530
@skip_no_hopper
531+
@skip_arm
531532
@pytest.mark.skip_less_device(4)
532533
@pytest.mark.parametrize("deepseek_v3_model_root", ['DeepSeek-V3-Lite-fp8'],
533534
indirect=True)
@@ -554,6 +555,7 @@ def test_disaggregated_deepseek_v3_lite_fp8_ucx(disaggregated_test_root,
554555

555556

556557
@skip_no_hopper
558+
@skip_arm
557559
@pytest.mark.parametrize("deepseek_v3_model_root", ['DeepSeek-V3-Lite-fp8'],
558560
indirect=True)
559561
def test_disaggregated_deepseek_v3_lite_fp8_nixl(disaggregated_test_root,
@@ -579,6 +581,7 @@ def test_disaggregated_deepseek_v3_lite_fp8_nixl(disaggregated_test_root,
579581

580582

581583
@skip_no_hopper
584+
@skip_arm
582585
@pytest.mark.parametrize("deepseek_v3_model_root", ['DeepSeek-V3-Lite-fp8'],
583586
indirect=True)
584587
def test_disaggregated_deepseek_v3_lite_fp8_ucx_tp1_single_gpu(

tests/integration/test_lists/waives.txt

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -443,3 +443,5 @@ test_e2e.py::test_ptp_quickstart_advanced[Llama3.1-8B-NVFP4-nvfp4-quantized/Meta
443443
test_e2e.py::test_ptp_quickstart_advanced[Mixtral-8x7B-NVFP4-nvfp4-quantized/Mixtral-8x7B-Instruct-v0.1] SKIP (https://nvbugs/5333659)
444444
test_e2e.py::test_ptp_quickstart_advanced[Nemotron-Super-49B-v1-NVFP4-nvfp4-quantized/Llama-3_3-Nemotron-Super-49B-v1_nvfp4_hf] SKIP (https://nvbugs/5333659)
445445
examples/test_multimodal.py::test_llm_multimodal_general[Mistral-Small-3.1-24B-Instruct-2503-pp:1-tp:1-bfloat16-bs:8-cpp_e2e:False-nb:1] SKIP (https://nvbugs/5331031)
446+
accuracy/test_disaggregated_serving.py::TestLlama4ScoutInstruct::test_auto_dtype[True] SKIP (https://nvbugs/5336321)
447+
accuracy/test_disaggregated_serving.py::TestLlama4ScoutInstruct::test_auto_dtype[False] SKIP (https://nvbugs/5336321)

0 commit comments

Comments
 (0)