diff --git a/HuggingFaceTB/SmolLM3-3B/accuracy/tasks.yml b/HuggingFaceTB/SmolLM3-3B/accuracy/tasks.yml
index 0b4633c..72dcb0f 100644
--- a/HuggingFaceTB/SmolLM3-3B/accuracy/tasks.yml
+++ b/HuggingFaceTB/SmolLM3-3B/accuracy/tasks.yml
@@ -2,4 +2,4 @@ tasks:
   - name: gsm8k
     metrics:
       - name: exact_match,strict-match
-        value: 0
+        value: 0.4708
diff --git a/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8/accuracy/server.yml b/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8/accuracy/server.yml
new file mode 100644
index 0000000..d11f711
--- /dev/null
+++ b/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8/accuracy/server.yml
@@ -0,0 +1,3 @@
+trust-remote-code: true
+tensor-parallel-size: 4
+max-model-len: 4096
diff --git a/RedHatAI/DeepSeek-R1-0528-quantized.w4a16/accuracy/server.yml b/RedHatAI/DeepSeek-R1-0528-quantized.w4a16/accuracy/server.yml
index fbae63f..81cff55 100644
--- a/RedHatAI/DeepSeek-R1-0528-quantized.w4a16/accuracy/server.yml
+++ b/RedHatAI/DeepSeek-R1-0528-quantized.w4a16/accuracy/server.yml
@@ -1,3 +1,4 @@
 max-model-len: 4096
 tensor-parallel-size: 8
 trust-remote-code: true
+gpu-memory-utilization: 0.8
diff --git a/deepseek-ai/DeepSeek-R1-0528/accuracy/tasks.yml b/deepseek-ai/DeepSeek-R1-0528/accuracy/tasks.yml
new file mode 100644
index 0000000..0b4633c
--- /dev/null
+++ b/deepseek-ai/DeepSeek-R1-0528/accuracy/tasks.yml
@@ -0,0 +1,5 @@
+tasks:
+  - name: gsm8k
+    metrics:
+      - name: exact_match,strict-match
+        value: 0
diff --git a/deepseek-ai/DeepSeek-R1-0528/storage.yml b/deepseek-ai/DeepSeek-R1-0528/storage.yml
new file mode 100644
index 0000000..fb93360
--- /dev/null
+++ b/deepseek-ai/DeepSeek-R1-0528/storage.yml
@@ -0,0 +1,3 @@
+# storage configs for https://huggingface.co/deepseek-ai/DeepSeek-R1-0528
+model: hf
+data: hf