From 36b49bf32d700e5048a348e78efb93333601f5c0 Mon Sep 17 00:00:00 2001
From: Jan Kaniecki
Date: Tue, 10 Sep 2024 15:51:14 +0200
Subject: [PATCH] Skip compilation warnings during warmup phase

---
 vllm/worker/habana_model_runner.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/worker/habana_model_runner.py b/vllm/worker/habana_model_runner.py
index 8d6c386a9975e..b6218f3cc4cfb 100644
--- a/vllm/worker/habana_model_runner.py
+++ b/vllm/worker/habana_model_runner.py
@@ -1314,7 +1314,7 @@ def warmup_scenario(self,
         torch.hpu.synchronize()
         for _ in range(times):
             inputs = self.prepare_model_input(seqs)
-            self.execute_model(inputs, kv_caches, warmup_mode=False)
+            self.execute_model(inputs, kv_caches, warmup_mode=True)
             torch.hpu.synchronize()
         gc.collect()