|
@@ -176,7 +176,7 @@ class BlockSpaceManager:
|
|
|
return len(blocks) <= self.cpu_allocator.get_num_free_blocks()
|
|
|
|
|
|
def swap_out(self, seq_group: SequenceGroup) -> Dict[int, int]:
|
|
|
- # GPU block -> CPU block
|
|
|
+ # GPU block -> CPU block.
|
|
|
mapping: Dict[PhysicalTokenBlock, PhysicalTokenBlock] = {}
|
|
|
for seq in seq_group.get_seqs():
|
|
|
if seq.is_finished():
|
|
@@ -189,9 +189,10 @@ class BlockSpaceManager:
|
|
|
cpu_block = mapping[gpu_block]
|
|
|
cpu_block.ref_count += 1
|
|
|
else:
|
|
|
- cpu_block = self.cpu_allocator.allocate
|
|
|
+ cpu_block = self.cpu_allocator.allocate()
|
|
|
mapping[gpu_block] = cpu_block
|
|
|
new_block_table.append(cpu_block)
|
|
|
+ # Free the GPU block swapped out to CPU.
|
|
|
self.gpu_allocator.free(gpu_block)
|
|
|
self.block_tables[seq.seq_id] = new_block_table
|
|
|
|