Skip to content

Commit 6d72170

Browse files
committed
Revert "update itemsize bits"
This reverts commit 47aaea9.
1 parent 89882cc commit 6d72170

File tree

2 files changed

+2
-2
lines changed

2 files changed

+2
-2
lines changed

tpu_inference/kernels/ragged_paged_attention/v3/util.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -13,7 +13,7 @@ def align_to(x, a):
 13  13 |
 14  14 |
 15  15 |   def get_dtype_bitwidth(dtype):
 16     | - return dtypes.itemsize_bits(dtype)
     16 | + return dtypes.bit_width(dtype)
 17  17 |
 18  18 |
 19  19 |   def get_dtype_packing(dtype):

tpu_inference/runner/kv_cache.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -114,7 +114,7 @@ def get_rpa_page_size_bytes(mesh: Mesh, kv_cache_specs: dict[str, Any]) -> int:
114 114 |   assert isinstance(kv_cache_spec, AttentionSpec)
115 115 |
116 116 |   dtype = t2j_dtype(kv_cache_spec.dtype)
117     | - bits = dtypes.itemsize_bits(dtype)
    117 | + bits = dtypes.bit_width(dtype)
118 118 |
119 119 |   kv_cache_shape = get_kv_cache_shape_with_mesh(
120 120 |   mesh=mesh,

0 commit comments

Comments
 (0)