Mustafa Öztürk committed on
Commit
c399765
·
1 Parent(s): 7a29d91

Collect garbage after quantization to reduce peak RAM

Browse files
Files changed (1) hide show
  1. app/ml/model_loader.py +5 -0
app/ml/model_loader.py CHANGED
@@ -1,3 +1,5 @@
 
 
1
  import torch
2
  from detoxify import Detoxify
3
  from transformers import AutoModelForSequenceClassification, AutoTokenizer, pipeline
@@ -33,6 +35,7 @@ def load_system():
33
  dtype=torch.qint8,
34
  )
35
  model_o.eval()
 
36
  except Exception:
37
  pass
38
 
@@ -55,6 +58,7 @@ def load_system():
55
  {torch.nn.Linear},
56
  dtype=torch.qint8,
57
  )
 
58
  except Exception:
59
  pass
60
  try:
@@ -63,6 +67,7 @@ def load_system():
63
  {torch.nn.Linear},
64
  dtype=torch.qint8,
65
  )
 
66
  except Exception:
67
  pass
68
 
 
1
+ import gc
2
+
3
  import torch
4
  from detoxify import Detoxify
5
  from transformers import AutoModelForSequenceClassification, AutoTokenizer, pipeline
 
35
  dtype=torch.qint8,
36
  )
37
  model_o.eval()
38
+ gc.collect()
39
  except Exception:
40
  pass
41
 
 
58
  {torch.nn.Linear},
59
  dtype=torch.qint8,
60
  )
61
+ gc.collect()
62
  except Exception:
63
  pass
64
  try:
 
67
  {torch.nn.Linear},
68
  dtype=torch.qint8,
69
  )
70
+ gc.collect()
71
  except Exception:
72
  pass
73