From 9534298678d8ef855e197fd48f35fea7045138ef Mon Sep 17 00:00:00 2001 From: Yingge He Date: Wed, 14 Aug 2024 10:59:48 -0700 Subject: [PATCH] Longer time for A100 --- ci/L0_backend_vllm/metrics_test/vllm_metrics_test.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/ci/L0_backend_vllm/metrics_test/vllm_metrics_test.py b/ci/L0_backend_vllm/metrics_test/vllm_metrics_test.py index fbe6675f..bea63ede 100644 --- a/ci/L0_backend_vllm/metrics_test/vllm_metrics_test.py +++ b/ci/L0_backend_vllm/metrics_test/vllm_metrics_test.py @@ -127,14 +127,14 @@ def test_vllm_metrics(self): # vllm:time_to_first_token_seconds self.assertEqual(metrics_dict["vllm:time_to_first_token_seconds_count"], 3) - self.assertTrue( - 0 < metrics_dict["vllm:time_to_first_token_seconds_sum"] < 0.0005 - ) + self.assertTrue(0 < metrics_dict["vllm:time_to_first_token_seconds_sum"] < 0.01) + self.assertEqual(metrics_dict["vllm:time_to_first_token_seconds_bucket"], 3) # vllm:time_per_output_token_seconds self.assertEqual(metrics_dict["vllm:time_per_output_token_seconds_count"], 45) self.assertTrue( - 0 <= metrics_dict["vllm:time_per_output_token_seconds_sum"] <= 0.005 + 0 < metrics_dict["vllm:time_per_output_token_seconds_sum"] < 0.1 ) + self.assertEqual(metrics_dict["vllm:time_per_output_token_seconds_bucket"], 45) def test_vllm_metrics_disabled(self): # Test vLLM metrics