Spaces:

NextGenTech
/

ngt-ai-platform

Sleeping

GaetanoParente committed on Jan 28

Commit

76955f7

1 Parent(s): 03a98ed

aggiunto recupero modello bert da HF hub

Files changed (6) hide show

.gitignore CHANGED Viewed

	@@ -1 +1 @@
1	- __pycache__/data/model/bpo_bert_model/*.safetensors


1	+ __pycache__/

README.md CHANGED Viewed

@@ -77,8 +77,6 @@ ngt-ai-platform/
 ├── modules/                # Logica di business
 └── data/
     ├── model/              # CARTELLA MODELLI (Non versionata)
-    │   ├── bpo_bert_model/ # Cartella del modello BERT addestrato
-    │   └── ...             # modelli addestrati da noi
     ├── gallery/            # Immagini di esempio per la Demo
     └── tokenizer/          # tokenizer per la BinaryClassification e MultiClassification

 ├── modules/                # Logica di business
 └── data/
     ├── model/              # CARTELLA MODELLI (Non versionata)
     ├── gallery/            # Immagini di esempio per la Demo
     └── tokenizer/          # tokenizer per la BinaryClassification e MultiClassification

data/model/bpo_bert_model/config.json DELETED Viewed

@@ -1,39 +0,0 @@
-{
-  "activation": "gelu",
-  "architectures": [
-    "DistilBertForSequenceClassification"
-  ],
-  "attention_dropout": 0.1,
-  "bos_token_id": null,
-  "dim": 768,
-  "dropout": 0.1,
-  "dtype": "float32",
-  "eos_token_id": null,
-  "hidden_dim": 3072,
-  "id2label": {
-    "0": "LABEL_0",
-    "1": "LABEL_1",
-    "2": "LABEL_2"
-  },
-  "initializer_range": 0.02,
-  "label2id": {
-    "LABEL_0": 0,
-    "LABEL_1": 1,
-    "LABEL_2": 2
-  },
-  "max_position_embeddings": 512,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
-  "output_past": true,
-  "pad_token_id": 0,
-  "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
-  "tie_word_embeddings": true,
-  "transformers_version": "5.0.0",
-  "use_cache": false,
-  "vocab_size": 119547
-}

data/model/bpo_bert_model/tokenizer.json DELETED Viewed

The diff for this file is too large to render. See raw diff

data/model/bpo_bert_model/tokenizer_config.json DELETED Viewed

@@ -1,14 +0,0 @@
-{
-  "backend": "tokenizers",
-  "cls_token": "[CLS]",
-  "do_lower_case": false,
-  "is_local": false,
-  "mask_token": "[MASK]",
-  "model_max_length": 512,
-  "pad_token": "[PAD]",
-  "sep_token": "[SEP]",
-  "strip_accents": null,
-  "tokenize_chinese_chars": true,
-  "tokenizer_class": "DistilBertTokenizer",
-  "unk_token": "[UNK]"
-}

modules/bpo_dispatcher.py CHANGED Viewed

@@ -17,23 +17,29 @@ LABELS_MAP = {
     2: "Retention / Churn Risk"
 }
 class BPODispatcher:
-    def __init__(self, model_path="data/model/bpo_bert_model"):
         self.model = None
         self.tokenizer = None
         self.nlp = None
-        self.device = "cpu"
-        # 1. BERT
-        if os.path.exists(model_path):
-            try:
-                self.tokenizer = DistilBertTokenizerFast.from_pretrained(model_path)
-                self.model = DistilBertForSequenceClassification.from_pretrained(model_path)
-                self.model.to(self.device)
-                self.model.eval()
-                print("✅ Modello BERT caricato.")
-            except Exception as e:
-                print(f"❌ Errore BERT: {e}")
         # 2. spaCy
         try:

     2: "Retention / Churn Risk"
 }
+MODEL_REPO_ID = "NextGenTech/bpo-bert-model"
 class BPODispatcher:
+    def __init__(self, model_id=MODEL_REPO_ID):
         self.model = None
         self.tokenizer = None
         self.nlp = None
+        self.device = "cpu" # In uno Space CPU basic, usa "cuda" solo se hai GPU
+        # 1. BERT (Caricamento da Hugging Face Hub)
+        print(f"🔄 Tentativo di caricamento modello da: {model_id}...")
+        try:
+            # token=True usa automaticamente il Secret 'HF_TOKEN' dello Space
+            self.tokenizer = DistilBertTokenizerFast.from_pretrained(model_id, token=True)
+            self.model = DistilBertForSequenceClassification.from_pretrained(model_id, token=True)
+            self.model.to(self.device)
+            self.model.eval()
+            print("✅ Modello BERT scaricato e caricato con successo.")
+        except OSError as e:
+            print(f"❌ Errore: Impossibile scaricare il modello. Verifica il Token e il Repo ID.")
+            print(f"Dettagli: {e}")
+        except Exception as e:
+            print(f"❌ Errore generico BERT: {e}")
         # 2. spaCy
         try: