Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
OpenDAS
vllm_cscc
Commits
4bc913ae
Unverified
Commit
4bc913ae
authored
Feb 03, 2026
by
shaharmor98
Committed by
GitHub
Feb 03, 2026
Browse files
Feat/add nemotron nano v3 tests (#33345)
parent
fbb3cf69
Changes
6
Show whitespace changes
Inline
Side-by-side
Showing
6 changed files
with
54 additions
and
0 deletions
+54
-0
.buildkite/lm-eval-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.yaml
...-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.yaml
+15
-0
.buildkite/lm-eval-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8.yaml
...l-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8.yaml
+19
-0
.buildkite/lm-eval-harness/configs/models-large-hopper.txt
.buildkite/lm-eval-harness/configs/models-large-hopper.txt
+1
-0
.buildkite/lm-eval-harness/configs/models-large.txt
.buildkite/lm-eval-harness/configs/models-large.txt
+1
-0
tests/config/base_model_arch_groundtruth.json
tests/config/base_model_arch_groundtruth.json
+17
-0
tests/config/test_model_arch_config.py
tests/config/test_model_arch_config.py
+1
-0
No files found.
.buildkite/lm-eval-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.yaml
0 → 100644
View file @
4bc913ae
model_name
:
"
nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16"
tasks
:
-
name
:
"
gsm8k"
metrics
:
-
name
:
"
exact_match,strict-match"
value
:
0.695
-
name
:
"
exact_match,flexible-extract"
value
:
0.447
limit
:
1319
num_fewshot
:
5
max_model_len
:
262144
enforce_eager
:
false
apply_chat_template
:
true
fewshot_as_multiturn
:
true
trust_remote_code
:
true
\ No newline at end of file
.buildkite/lm-eval-harness/configs/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8.yaml
0 → 100644
View file @
4bc913ae
model_name
:
"
nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-FP8"
tasks
:
-
name
:
"
gsm8k"
metrics
:
-
name
:
"
exact_match,strict-match"
value
:
0.7142
-
name
:
"
exact_match,flexible-extract"
value
:
0.4579
env_vars
:
VLLM_USE_FLASHINFER_MOE_FP8
:
"
1"
VLLM_FLASHINFER_MOE_BACKEND
:
"
throughput"
limit
:
1319
num_fewshot
:
5
max_model_len
:
262144
kv_cache_dtype
:
fp8
enforce_eager
:
false
apply_chat_template
:
true
fewshot_as_multiturn
:
true
trust_remote_code
:
true
.buildkite/lm-eval-harness/configs/models-large-hopper.txt
View file @
4bc913ae
Qwen3-235B-A22B-Instruct-2507-FP8.yaml
NVIDIA-Nemotron-3-Nano-30B-A3B-FP8.yaml
.buildkite/lm-eval-harness/configs/models-large.txt
View file @
4bc913ae
...
...
@@ -3,3 +3,4 @@ Meta-Llama-3-70B-Instruct.yaml
Mixtral-8x7B-Instruct-v0.1.yaml
Qwen2-57B-A14-Instruct.yaml
DeepSeek-V2-Lite-Chat.yaml
NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.yaml
tests/config/base_model_arch_groundtruth.json
View file @
4bc913ae
...
...
@@ -355,5 +355,22 @@
"is_deepseek_mla"
:
true
,
"is_multimodal_model"
:
false
,
"dtype"
:
"torch.float32"
},
"nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16"
:
{
"architectures"
:
[
"NemotronHForCausalLM"
],
"model_type"
:
"nemotron_h"
,
"text_model_type"
:
"nemotron_h"
,
"hidden_size"
:
2688
,
"total_num_hidden_layers"
:
52
,
"total_num_attention_heads"
:
32
,
"head_size"
:
128
,
"vocab_size"
:
131072
,
"total_num_kv_heads"
:
2
,
"num_experts"
:
128
,
"is_deepseek_mla"
:
false
,
"is_multimodal_model"
:
false
,
"dtype"
:
"torch.bfloat16"
}
}
tests/config/test_model_arch_config.py
View file @
4bc913ae
...
...
@@ -14,6 +14,7 @@ from vllm.transformers_utils.model_arch_config_convertor import (
BASE_TRUST_REMOTE_CODE_MODELS
=
{
"nvidia/Llama-3_3-Nemotron-Super-49B-v1"
,
"nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16"
,
"XiaomiMiMo/MiMo-7B-RL"
,
# Excluded: Not available online right now
# "FreedomIntelligence/openPangu-Ultra-MoE-718B-V1.1",
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment