From 527c5e799ab40c2dd5c238b46e3f68bcbc7404e1 Mon Sep 17 00:00:00 2001
From: Pensieve Intern
Date: Mon, 15 Jun 2026 13:14:44 +0000
Subject: [PATCH] Add Gemma 4 E4B MTP vLLM speedbench cell

Signed-off-by: Pensieve Intern
---
Reviewer notes (free text placed between the three-dash line and the first
"diff --git" line is not part of the commit message or of the patch):

  * This patch creates one new YAML file with two top-level mappings:
    sampling_kwargs (temperature: 0) and engine_args (max_model_len: 65536).
  * The file name carries the suffixes "t0" and "d7". "t0" presumably mirrors
    temperature: 0. No key in the new file corresponds to "d7"; presumably it
    is supplied elsewhere or derived from the file name -- TODO confirm.
  * NOTE(review): line breaks were restored from a copy in which the whole
    patch sat on a single line. The two-space indent of the nested keys is a
    reconstruction; the blob id on the "index" line only matches if the
    original indent was also two spaces -- verify against the source commit.
  * NOTE(review): the From: and Signed-off-by: lines carry no e-mail address
    in this copy (presumably stripped); restore it before running git am.

 .../specdec_bench/_cells/gemma-4-E4B-it_mtp_vllm_t0_d7.yaml | 4 ++++
 1 file changed, 4 insertions(+)
 create mode 100644 tools/launcher/common/specdec_bench/_cells/gemma-4-E4B-it_mtp_vllm_t0_d7.yaml

diff --git a/tools/launcher/common/specdec_bench/_cells/gemma-4-E4B-it_mtp_vllm_t0_d7.yaml b/tools/launcher/common/specdec_bench/_cells/gemma-4-E4B-it_mtp_vllm_t0_d7.yaml
new file mode 100644
index 00000000000..552e786b797
--- /dev/null
+++ b/tools/launcher/common/specdec_bench/_cells/gemma-4-E4B-it_mtp_vllm_t0_d7.yaml
@@ -0,0 +1,4 @@
+sampling_kwargs:
+  temperature: 0
+engine_args:
+  max_model_len: 65536