Skip to content

Commit 0fc7dad

Browse files
committed
tweaks
Signed-off-by: Juncheng Gu <jcgu@google.com>
1 parent a5ec87d commit 0fc7dad

File tree

1 file changed

+2
-3
lines changed

1 file changed

+2
-3
lines changed

tests/distributed/offload/tpu_offload_connector_scheduler_test.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -10,8 +10,7 @@
1010
from vllm.v1.request import Request
1111

1212
from tpu_inference.distributed.offload.tpu_offload_connector import (
13-
DEFAULT_TPU_OFFLOAD_CPU_CHUNKS, RequestTracker,
14-
TPUOffloadConnectorScheduler)
13+
RequestTracker, TPUOffloadConnectorScheduler)
1514

1615
_DEFAULT_BLOCK_SIZE = 16
1716

@@ -63,7 +62,7 @@ def _scheduler(
6362
block_size: int = _DEFAULT_BLOCK_SIZE,
6463
offload_decode_save: int = 0,
6564
offload_staging_buffer_tokens: int = -1,
66-
offload_num_cpu_chunks: int = DEFAULT_TPU_OFFLOAD_CPU_CHUNKS,
65+
offload_num_cpu_chunks: int = -1,
6766
):
6867
# update config
6968
vllm_config = MockVllmConfig(block_size=block_size)

0 commit comments

Comments
 (0)