Skip to content

Commit 90245a3

Browse files
authored
release state cache (#4462)
1 parent 25d9517 commit 90245a3

1 file changed

Lines changed: 2 additions & 0 deletions

File tree

  • lmdeploy/pytorch/engine/model_agent

lmdeploy/pytorch/engine/model_agent/agent.py

Lines changed: 2 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1208,6 +1208,7 @@ async def sleep(self, level: int = 1):
1208 1208 |   if self.dist_config.dp > 1:
1209 1209 |   await self.state.to_sleep.wait()
1210 1210 |   self.cache_engine = None
     1211 | + self.state_cache_engine = None
1211 1212 |   self.reset_graph_runner()
1212 1213 |   device = 'cpu' if level == 1 else 'meta'
1213 1214 |   self.patched_model.get_model().to(device=device, non_blocking=True)
@@ -1245,4 +1246,5 @@ def release(self):
1245 1246 |   self.reset_graph_runner()
1246 1247 |   self.patched_model = None
1247 1248 |   self.cache_engine = None
     1249 | + self.state_cache_engine = None
1248 1250 |   torch.cuda.empty_cache()

0 commit comments

Comments
 (0)