Spaces:

Akeb0n0
/

ML2_HFtune_basic

Running

Akeb0n0 committed on Apr 5, 2025

Commit

431d797

verified ·

1 Parent(s): 2b4bdc4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -4,13 +4,19 @@ import torch.serialization
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 @st.cache_resource
-def load_model():
-    checkpoint = torch.load('TinyBERT_cls_model.pt',
                           map_location='cpu',
                           weights_only=False)
     model = AutoModelForSequenceClassification.from_pretrained(
-        "huawei-noah/TinyBERT_General_4L_312D",
         num_labels=len(checkpoint['idx_to_category'])
     )
     model.load_state_dict(checkpoint['model_state_dict'])
@@ -20,7 +26,7 @@ def load_model():
     return model, tokenizer, idx_to_category
-def predict(title, abstract, model, tokenizer, idx_to_category, threshold=0.95):
     text = f"{title} /n {abstract}" if abstract else title
     inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512)

 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 @st.cache_resource
+def load_model():
+    #trained_model = 'TinyBERT_cls_model.pt'
+    #base_model = 'huawei-noah/TinyBERT_General_4L_312D'
+    trained_model = 'distilbert-base_cls_model.pt'
+    base_model = 'distilbert-base-uncased'
+    checkpoint = torch.load(trained_model,
                           map_location='cpu',
                           weights_only=False)
     model = AutoModelForSequenceClassification.from_pretrained(
+        base_model,
         num_labels=len(checkpoint['idx_to_category'])
     )
     model.load_state_dict(checkpoint['model_state_dict'])
     return model, tokenizer, idx_to_category
+def predict(title, abstract, model, tokenizer, idx_to_category, threshold=0.97):
     text = f"{title} /n {abstract}" if abstract else title
     inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512)