@@ -872,7 +872,7 @@ def request_match_blocks(self, task: Request, block_size, *args):
872872 read_storage_task = ReadStorageTask (
873873 task_id = req_id ,
874874 keys = no_match_block_keys ,
875- token_ids = input_token_ids ,
875+ token_ids = input_token_ids if self . kvcache_storage_backend == "attention_store" else None ,
876876 gpu_block_ids = gpu_recv_storage_block_ids ,
877877 start_read_block_idx = match_token_num // block_size ,
878878 )
@@ -1111,7 +1111,9 @@ def write_cache_to_storage(self, request: Request):
11111111 if isinstance (token_ids , np .ndarray ):
11121112 token_ids = token_ids .tolist ()
11131113 if self .config .cache_config .enable_output_caching :
1114- token_ids += request .output_token_ids
1114+ input_token_ids = token_ids + request .output_token_ids
1115+ else :
1116+ input_token_ids = token_ids
11151117
11161118 req_id = request .request_id
11171119 keys = []
@@ -1128,7 +1130,7 @@ def write_cache_to_storage(self, request: Request):
11281130 write_storage_task = WriteStorageTask (
11291131 task_id = req_id ,
11301132 keys = keys ,
1131- token_ids = token_ids ,
1133+ token_ids = input_token_ids if self . kvcache_storage_backend == "attention_store" else None ,
11321134 gpu_block_ids = gpu_block_ids ,
11331135 )
11341136 logger .debug (f"issue write storage task: { write_storage_task } " )
@@ -2067,7 +2069,7 @@ def recv_data_transfer_result(self):
20672069 event_type = data [0 ]
20682070
20692071 if event_type .value == CacheStatus .STORAGE2GPU .value :
2070- logger .info (f"recv_data_transfer_result: { data } " )
2072+ logger .debug (f"recv_data_transfer_result: { data } " )
20712073 task_id , hash_keys , block_ids = data [1 :]
20722074 if task_id not in self .storage_prefetch_block_ids :
20732075 self .storage_prefetch_block_ids [task_id ] = []
@@ -2078,7 +2080,7 @@ def recv_data_transfer_result(self):
20782080 if task_id in self .task_prefetch_event :
20792081 self .task_prefetch_event [task_id ].set ()
20802082 elif event_type .value == CacheStatus .GPU2STORAGE .value :
2081- logger .info (f"recv_data_transfer_result: { data } " )
2083+ logger .debug (f"recv_data_transfer_result: { data } " )
20822084 task_id , hash_keys , block_ids = data [1 :]
20832085 if task_id in self .task_write_back_event :
20842086 self .task_write_back_event [task_id ].set ()
0 commit comments