Skip to content

Commit 69c1d90

Browse files
authored
Update model paths to use llm_models_root instead of HF
Signed-off-by: Gal Hubara-Agam <96368689+galagam@users.noreply.github.com>
1 parent b854e14 commit 69c1d90

File tree

1 file changed

+3
-3
lines changed

1 file changed

+3
-3
lines changed

tests/integration/defs/accuracy/test_llm_api_autodeploy.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -264,9 +264,9 @@ class TestNemotronSuperV3(LlmapiAccuracyTestHarness):
264 264
"""
265 265

266 266
MODEL_NAME = "nvidia/NVIDIA-Nemotron-3-Super-120B-012726"
267-
MODEL_PATH_BF16 = f"nvidia/NVIDIA-Nemotron-3-Super-120B-BF16-BF16KV-012726"
268-
MODEL_PATH_FP8 = "nvidia/NVIDIA-Nemotron-3-Super-120B-FP8-FP8KV-012726"
269-
MODEL_PATH_FP4 = f"nvidia/NVIDIA-Nemotron-3-Super-120B-NVFP4-FP8KV-012726"
267+
MODEL_PATH_BF16 = f"{llm_models_root()}/NVIDIA-Nemotron-3-Super-120B-BF16-BF16KV-012726"
268+
MODEL_PATH_FP8 = f"{llm_models_root()}/NVIDIA-Nemotron-3-Super-120B-FP8-FP8KV-012726"
269+
MODEL_PATH_FP4 = f"{llm_models_root()}/NVIDIA-Nemotron-3-Super-120B-NVFP4-FP8KV-012726"
270 270

271 271
# Set minimum possible seq len + small buffer, for test speed & memory usage
272 272
MAX_SEQ_LEN = max(MMLU.MAX_INPUT_LEN + MMLU.MAX_OUTPUT_LEN,

0 commit comments

Comments
 (0)