Revert "Allocate blocks from id=1 for HPU (#160)" (#163)

This reverts commit b43c7f9.
opendatahub-io · Aug 6, 2024 · 37ca17f · 37ca17f
1 parent b43c7f9
commit 37ca17f
Showing 1 changed file with 2 additions and 4 deletions.
diff --git a/vllm/core/block/cpu_gpu_block_allocator.py b/vllm/core/block/cpu_gpu_block_allocator.py
@@ -4,7 +4,7 @@
                                         DeviceAwareBlockAllocator)
 from vllm.core.block.naive_block import NaiveBlock, NaiveBlockAllocator
 from vllm.core.block.prefix_caching_block import PrefixCachingBlockAllocator
-from vllm.utils import Device, is_hpu
+from vllm.utils import Device
 
 
 class CpuGpuBlockAllocator(DeviceAwareBlockAllocator):
@@ -52,9 +52,7 @@ def create(
             - The block IDs are assigned contiguously, with GPU block IDs coming
                 before CPU block IDs.
         """
-        # For HPU block ids cannot be equal to 0
-        start_id = 1 if is_hpu() else 0
-        block_ids = list(range(start_id, num_gpu_blocks + num_cpu_blocks))
+        block_ids = list(range(num_gpu_blocks + num_cpu_blocks))
         gpu_block_ids = block_ids[:num_gpu_blocks]
         cpu_block_ids = block_ids[num_gpu_blocks:]