From 65419f4423f436879e8ea927221d0b996906ea1b Mon Sep 17 00:00:00 2001
From: Woosuk Kwon
Date: Fri, 14 Jun 2024 14:40:09 -0700
Subject: [PATCH] [Bugfix] Fix typo in Pallas backend (#5558)

---
 vllm/attention/backends/pallas.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/vllm/attention/backends/pallas.py b/vllm/attention/backends/pallas.py
index 75f2465264ad3..b203c5ec54c92 100644
--- a/vllm/attention/backends/pallas.py
+++ b/vllm/attention/backends/pallas.py
@@ -110,7 +110,7 @@ def __init__(
                 raise NotImplementedError("TPU version must be 4 or higher.")
 
         self.megacore_mode = None
-        tpu_type = torch_xla.tpu.get_tp_groupu_env()["TYPE"].lower()
+        tpu_type = torch_xla.tpu.get_tpu_env()["TYPE"].lower()
         if not tpu_type.endswith("lite"):
             if self.num_kv_heads % 2 == 0:
                 self.megacore_mode = "kv_head"