Skip to content

Commit df724fd

Browse files
authored
Merge pull request #393 from mefich/main
Unloading vision model of VLMs for Exllamav3 backend
2 parents fece479 + 37aea9d commit df724fd

1 file changed

Lines changed: 4 additions & 0 deletions

File tree

backends/exllamav3/model.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -563,6 +563,10 @@ async def unload(self, loras_only: bool = False, **kwargs):
563563
self.draft_config = None
564564
self.draft_cache = None
565565

566+
if self.use_vision:
567+
self.vision_model.unload()
568+
self.vision_model = None
569+
566570
# Cleanup the generator from any pending jobs
567571
if self.generator is not None:
568572
await self.generator.close()

0 commit comments

Comments
 (0)