EvolphTech
/

Wildnerve-tlm01_Hybrid_Model

Text Generation

wildnerve_tlm01

Model card Files Files and versions

xet

Community

WildnerveAI committed on May 14, 2025

Commit

234321b

verified ·

1 Parent(s): 1c78d33

Upload load_model_weights.py

Browse files

Files changed (1) hide show

load_model_weights.py +39 -9

load_model_weights.py CHANGED Viewed

@@ -67,7 +67,7 @@ def verify_token():
     # Clean up token format - remove any "Bearer " prefix if present
     if token.startswith("Bearer "):
-        token = token[7:].trip()
         os.environ["HF_TOKEN"] = token  # Store the cleaned token
     token_length = len(token)
@@ -512,21 +512,25 @@ def download_model_files(repo_id_base: str, sub_dir: Optional[str] = None,
         except Exception as e:
             logger.error(f"Failed to download fallback model: {e}")
-    # Try public models if private repositories fail
     if not transformer_path:
-        logger.warning("⚠️ Could not download from private repos, trying public models")
         try:
-            # Try to download from public models directly using model IDs
             public_models = [
-                "gpt2",           # Small but works well
-                "distilgpt2",      # Even smaller
-                "facebook/opt-125m"  # Another small model
             ]
             for model_id in public_models:
-                logger.info(f"Trying public model: {model_id}")
                 try:
-                    transformer_path = download_file(model_id, "pytorch_model.bin", cache_dir, None)
                     if transformer_path:
                         downloaded_files["transformer"] = transformer_path
                         logger.info(f"✅ Successfully downloaded weights from {model_id}")
@@ -536,6 +540,32 @@ def download_model_files(repo_id_base: str, sub_dir: Optional[str] = None,
         except Exception as e:
             logger.error(f"Failed to download public models: {e}")
     # Download SNN weights if transformer weights were found
     if "transformer" in downloaded_files:

     # Clean up token format - remove any "Bearer " prefix if present
     if token.startswith("Bearer "):
+        token = token[7:].strip()  # Fix typo: .trip() -> .strip()
         os.environ["HF_TOKEN"] = token  # Store the cleaned token
     token_length = len(token)
         except Exception as e:
             logger.error(f"Failed to download fallback model: {e}")
+    # Try public models if private repositories fail - ADD MORE PUBLIC MODELS
     if not transformer_path:
+        logger.warning("⚠️ Could not download from private repos, trying public models WITHOUT token")
         try:
+            # Try to download from public models directly using model IDs that don't require authentication
             public_models = [
+                "TinyLlama/TinyLlama-1.1B-Chat-v1.0",  # Try this one first - it's small but good
+                "google/mobilevit-small", # Very small model
+                "prajjwal1/bert-tiny",    # Extremely small BERT
+                "distilbert/distilbert-base-uncased",  # Public DistilBERT
+                "google/bert_uncased_L-2_H-128_A-2",   # Tiny BERT
+                "hf-internal-testing/tiny-random-gptj"  # Super tiny test model
             ]
             for model_id in public_models:
+                logger.info(f"Trying public model WITHOUT token: {model_id}")
                 try:
+                    # IMPORTANT: Don't pass the token for these public models
+                    transformer_path = download_file(model_id, "pytorch_model.bin", cache_dir, token=None)
                     if transformer_path:
                         downloaded_files["transformer"] = transformer_path
                         logger.info(f"✅ Successfully downloaded weights from {model_id}")
         except Exception as e:
             logger.error(f"Failed to download public models: {e}")
+        # If still no weights, try to use a model from the transformers library directly
+        if not transformer_path:
+            try:
+                # Try to use tiny-bert which should be bundled with transformers
+                logger.info("Attempting to use tiny-bert from transformers cache")
+                from transformers import AutoModel, AutoTokenizer
+                model_id = "prajjwal1/bert-tiny"
+                tiny_model = AutoModel.from_pretrained(model_id)
+                tiny_tokenizer = AutoTokenizer.from_pretrained(model_id)
+                # Save the model to a local file we can use
+                tmp_dir = os.path.join(cache_dir or "/tmp/tlm_cache", "tiny-bert")
+                os.makedirs(tmp_dir, exist_ok=True)
+                temp_file = os.path.join(tmp_dir, "pytorch_model.bin")
+                # Save model state dict
+                torch.save(tiny_model.state_dict(), temp_file)
+                logger.info(f"✅ Saved tiny-bert model to {temp_file}")
+                # Add to downloaded files
+                downloaded_files["transformer"] = temp_file
+                transformer_path = temp_file
+            except Exception as e:
+                logger.error(f"Failed to use tiny-bert from transformers: {e}")
     # Download SNN weights if transformer weights were found
     if "transformer" in downloaded_files: