Skip to content

Commit 0358329

Browse files
[fix] initialize available_gpu_block_num with max_gpu_block_num (#4193)
1 parent 01f6934 commit 0358329

1 file changed

Lines changed: 5 additions & 0 deletions

File tree

fastdeploy/cache_manager/prefix_cache_manager.py

Lines changed: 5 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -113,6 +113,10 @@ def __init__(
113113
+ f"{self.num_cpu_blocks}, bytes_per_layer_per_block {self.cache_config.bytes_per_layer_per_block}"
114114
)
115115

116+
main_process_metrics.max_gpu_block_num.set(self.num_gpu_blocks)
117+
main_process_metrics.available_gpu_block_num.set(self.num_gpu_blocks)
118+
main_process_metrics.available_gpu_resource.set(1.0)
119+
116120
@property
117121
def available_gpu_resource(self):
118122
return len(self.gpu_free_block_list) / self.num_gpu_blocks if self.num_gpu_blocks > 0 else 0.0
@@ -269,6 +273,7 @@ def update_cache_config(self, cache_config):
269273
self.node_id_pool = list(range(self.num_gpu_blocks + self.num_cpu_blocks))
270274

271275
main_process_metrics.max_gpu_block_num.set(self.num_gpu_blocks)
276+
main_process_metrics.available_gpu_block_num.set(self.num_gpu_blocks)
272277
main_process_metrics.available_gpu_resource.set(1.0)
273278

274279
def can_allocate_gpu_blocks(self, num_blocks: int):

0 commit comments

Comments
 (0)