diff --git a/.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json b/.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json index 63f1f8ab8..9f226ef2f 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests-arm64-cpu.json @@ -36,6 +36,7 @@ "model": "meta-llama/Llama-3.1-8B-Instruct", "backend": "vllm", "ignore-eos": "", + "temperature": 0, "num_prompts": 200 } }, @@ -127,4 +128,4 @@ } } ] -} \ No newline at end of file +} diff --git a/.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json b/.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json index f0dc3d5ec..30879b5e9 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests-cpu-asr.json @@ -22,6 +22,7 @@ "hf_split": "test", "no_stream": "", "no_oversample": "", + "temperature": 0, "num_prompts": 200 } }, diff --git a/.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json b/.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json index 0411b04e1..6c4591f05 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests-cpu-text.json @@ -26,6 +26,7 @@ "model": "meta-llama/Llama-3.1-8B-Instruct", "backend": "vllm", "ignore-eos": "", + "temperature": 0, "num_prompts": 200 } }, diff --git a/.buildkite/performance-benchmarks/tests/serving-tests-cpu.json b/.buildkite/performance-benchmarks/tests/serving-tests-cpu.json index f66ef2af4..c2d7768e2 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests-cpu.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests-cpu.json @@ -26,6 +26,7 @@ "model": "meta-llama/Llama-3.1-8B-Instruct", "backend": "vllm", "ignore-eos": "", + "temperature": 0, "num_prompts": 200 } }, diff --git a/.buildkite/performance-benchmarks/tests/serving-tests-hpu.json b/.buildkite/performance-benchmarks/tests/serving-tests-hpu.json index 3929aa5fb..d5ef98168 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests-hpu.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests-hpu.json @@ -21,6 +21,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -47,6 +48,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -73,6 +75,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -100,6 +103,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -127,6 +131,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -151,6 +156,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } } diff --git a/.buildkite/performance-benchmarks/tests/serving-tests.json b/.buildkite/performance-benchmarks/tests/serving-tests.json index 66d52abc1..36e3d4170 100644 --- a/.buildkite/performance-benchmarks/tests/serving-tests.json +++ b/.buildkite/performance-benchmarks/tests/serving-tests.json @@ -13,6 +13,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -30,6 +31,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -47,6 +49,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }, @@ -67,6 +70,7 @@ "backend": "vllm", "dataset_name": "sharegpt", "dataset_path": "./ShareGPT_V3_unfiltered_cleaned_split.json", + "temperature": 0, "num_prompts": 200 } }