Spaces:

HemanM
/

EvoTransformer-v2.1

Runtime error

HemanM committed on Jul 22, 2025

Commit

bf6e0ca

verified ·

1 Parent(s): e22bade

Update watchdog.py

Files changed (1) hide show

watchdog.py CHANGED Viewed

@@ -85,10 +85,16 @@ def retrain_model():
         if input_ids is None:
             return "⚠️ Not enough data to retrain.", None, "Please log more feedback first."
         config = mutate_config()
-        model = EvoTransformerForClassification(config)
         model.train()
         optimizer = torch.optim.Adam(model.parameters(), lr=2e-4)
         loss_fn = torch.nn.CrossEntropyLoss()
@@ -100,6 +106,10 @@ def retrain_model():
             optimizer.step()
             print(f"🔁 Epoch {epoch+1}: Loss = {loss.item():.4f}")
         # Accuracy
         model.eval()
         with torch.no_grad():
@@ -126,8 +136,9 @@ def retrain_model():
         with open(log_path, "w") as f:
             json.dump(history, f, indent=2)
-        # Save model
         model.save_pretrained("trained_model")
         print("✅ EvoTransformer retrained and saved.")
         # Load updated summary + plot

         if input_ids is None:
             return "⚠️ Not enough data to retrain.", None, "Please log more feedback first."
+        device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         config = mutate_config()
+        model = EvoTransformerForClassification(config).to(device)
         model.train()
+        input_ids = input_ids.to(device)
+        attention_masks = attention_masks.to(device)
+        labels = labels.to(device)
         optimizer = torch.optim.Adam(model.parameters(), lr=2e-4)
         loss_fn = torch.nn.CrossEntropyLoss()
             optimizer.step()
             print(f"🔁 Epoch {epoch+1}: Loss = {loss.item():.4f}")
+        # Sanity check logits
+        if logits.shape[-1] < 2:
+            raise ValueError("Logits shape invalid. Retrained model did not output 2 classes.")
         # Accuracy
         model.eval()
         with torch.no_grad():
         with open(log_path, "w") as f:
             json.dump(history, f, indent=2)
+        # Save model + tokenizer
         model.save_pretrained("trained_model")
+        tokenizer.save_pretrained("trained_model")
         print("✅ EvoTransformer retrained and saved.")
         # Load updated summary + plot