We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 25d9517 commit 90245a3 · Copy full SHA for 90245a3
1 file changed
lmdeploy/pytorch/engine/model_agent/agent.py
@@ -1208,6 +1208,7 @@ async def sleep(self, level: int = 1):
1208
if self.dist_config.dp > 1:
1209
await self.state.to_sleep.wait()
1210
self.cache_engine = None
1211
+ self.state_cache_engine = None
1212
self.reset_graph_runner()
1213
device = 'cpu' if level == 1 else 'meta'
1214
self.patched_model.get_model().to(device=device, non_blocking=True)
@@ -1245,4 +1246,5 @@ def release(self):
1245
1246
1247
self.patched_model = None
1248
1249
1250
torch.cuda.empty_cache()
0 commit comments