Allocate blocks from id=1 for HPU (vllm-project#160)

Xaenalt · Aug 6, 2024 · b43c7f9 · b43c7f9
1 parent 14c20a3
commit b43c7f9
Showing 1 changed file with 4 additions and 2 deletions.
diff --git a/vllm/core/block/cpu_gpu_block_allocator.py b/vllm/core/block/cpu_gpu_block_allocator.py
@@ -4,7 +4,7 @@
                                         DeviceAwareBlockAllocator)
 from vllm.core.block.naive_block import NaiveBlock, NaiveBlockAllocator
 from vllm.core.block.prefix_caching_block import PrefixCachingBlockAllocator
-from vllm.utils import Device
+from vllm.utils import Device, is_hpu
 
 
 class CpuGpuBlockAllocator(DeviceAwareBlockAllocator):
@@ -52,7 +52,9 @@ def create(
             - The block IDs are assigned contiguously, with GPU block IDs coming
                 before CPU block IDs.
         """
-        block_ids = list(range(num_gpu_blocks + num_cpu_blocks))
+        # For HPU, block ids cannot be equal to 0, so numbering starts at 1
+        start_id = 1 if is_hpu() else 0
+        block_ids = list(range(start_id, num_gpu_blocks + num_cpu_blocks))
         gpu_block_ids = block_ids[:num_gpu_blocks]
         cpu_block_ids = block_ids[num_gpu_blocks:]