Skip to content

Commit 72c5b97

Browse files
authored
Update tpu_worker.py's typo (#17288)
1 parent fa93cd9 commit 72c5b97

File tree

1 file changed

+2
-2
lines changed

1 file changed

+2
-2
lines changed

vllm/worker/tpu_worker.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -163,8 +163,8 @@ def determine_num_available_blocks(self) -> Tuple[int, int]:
163 163
usable_memory_size = int(total_memory_size *
164 164
self.cache_config.gpu_memory_utilization)
165 165
tpu_kv_cache_bytes = max(usable_memory_size - profiled, 0)
166-
dtype_btyes = get_dtype_size(self.cache_dtype)
167-
block_size_bytes = (dtype_btyes * self.cache_config.block_size *
166+
dtype_bytes = get_dtype_size(self.cache_dtype)
167+
block_size_bytes = (dtype_bytes * self.cache_config.block_size *
168 168
num_layers * 2 * head_size * num_kv_heads)
169 169
num_tpu_blocks = tpu_kv_cache_bytes // block_size_bytes
170 170
num_tpu_blocks = (num_tpu_blocks // 8) * 8 # Round down to 8.

0 commit comments

Comments
 (0)