Skip to content

Commit 9fb7562

Browse files
committed
add two configs
1 parent a96d83e commit 9fb7562

File tree

5 files changed

+15
-1
lines changed

5 files changed

+15
-1
lines changed

.buildkite/lm-eval-harness/configs/DeepSeek-V3.yaml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
# For vllm script, with -t option (tensor parallel size).
22
# bash ./run-lm-eval-gsm-vllm-baseline.sh -m deepseek-ai/DeepSeek-V3 -b 32 -l 250 -f 8
33
model_name: "deepseek-ai/DeepSeek-V3"
4+
backend: "vllm"
45
tasks:
56
- name: "gsm8k"
67
metrics:
@@ -11,6 +12,7 @@ tasks:
1112
limit: 50
1213
num_fewshot: 8
1314
trust_remote_code: True
15+
# TODO(zhewenl): we should increase batch_size and seq_len when we have MI300X or other large GPUs.
1416
max_model_len: 1024
1517
batch_size: 1
1618
gpu_memory_utilization: 0.98
Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,11 @@
1+
# For hf script, without -t option (tensor parallel size).
2+
# bash .buildkite/lm-eval-harness/run-lm-eval-gsm-hf-baseline.sh -m meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 -b 32 -l 250 -f 8
3+
model_name: "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"
4+
backend: "vllm-vlm"
5+
tasks:
6+
- name: "chartqa"
7+
metrics:
8+
- name: "relaxed_accuracy,none"
9+
value: 0.853
10+
limit: 100
11+
num_fewshot: 0

.buildkite/lm-eval-harness/configs/Meta-Llama-4-Maverick-17B-128E-Instruct-FP8.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,7 @@
11
# For hf script, without -t option (tensor parallel size).
22
# bash .buildkite/lm-eval-harness/run-lm-eval-gsm-hf-baseline.sh -m meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 -b 32 -l 250 -f 8
33
model_name: "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8"
4+
backend: "vllm-vlm"
45
tasks:
56
- name: "gsm8k"
67
metrics:
Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1 @@
1-
DeepSeek-V3.yaml
21
Meta-Llama-4-Maverick-17B-128E-Instruct-FP8.yaml
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
Meta-Llama-4-Maverick-17B-128E-Instruct-FP8-MM.yaml

0 commit comments

Comments
 (0)