Update tpu_worker.py 's typo (vllm-project#17288)

idouba · Yuqi Zhang · commit a895df487aa5 · 2025-05-24T08:02:38.000Z
Signed-off-by: Yuqi Zhang &lt;yuqizhang@google.com&gt;
diff --git a/vllm/worker/tpu_worker.py b/vllm/worker/tpu_worker.py
@@ -163,8 +163,8 @@ def determine_num_available_blocks(self) -> Tuple[int, int]:
         usable_memory_size = int(total_memory_size *
                                  self.cache_config.gpu_memory_utilization)
         tpu_kv_cache_bytes = max(usable_memory_size - profiled, 0)
-        dtype_btyes = get_dtype_size(self.cache_dtype)
-        block_size_bytes = (dtype_btyes * self.cache_config.block_size *
+        dtype_bytes = get_dtype_size(self.cache_dtype)
+        block_size_bytes = (dtype_bytes * self.cache_config.block_size *
                             num_layers * 2 * head_size * num_kv_heads)
         num_tpu_blocks = tpu_kv_cache_bytes // block_size_bytes
         num_tpu_blocks = (num_tpu_blocks // 8) * 8  # Round down to 8.