Spaces:

Saint5
/

multimodal_rag_system

Sleeping

Saint5 committed on Aug 21, 2025

Commit

ca11a08

verified ·

1 Parent(s): 2303390

Minor memory tweaks

Files changed (1) hide show

model_setup.py CHANGED Viewed

@@ -2,10 +2,11 @@
 """loading the models to be used by the Mulltimodal RAG system."""
 import torch
 from sentence_transformers import SentenceTransformer
 from transformers import AutoProcessor, Gemma3ForConditionalGeneration, BitsAndBytesConfig
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Embedding model
@@ -33,3 +34,7 @@ model.eval()
 # Processor
 processor = AutoProcessor.from_pretrained(model_name, use_fast=True)

 """loading the models to be used by the Mulltimodal RAG system."""
 import torch
+import gc
 from sentence_transformers import SentenceTransformer
 from transformers import AutoProcessor, Gemma3ForConditionalGeneration, BitsAndBytesConfig
+from utils import clear_gpu_cache
 device = "cuda" if torch.cuda.is_available() else "cpu"
 # Embedding model
 # Processor
 processor = AutoProcessor.from_pretrained(model_name, use_fast=True)
+# Free memory
+clear_gpu_cache()
+gc.collect()