Spaces:

ButterM40
/

Roleplay-Chat-Box

Running

App Files Files Community

ButterM40 commited on Nov 20, 2025

Commit

114bef9

1 Parent(s): 44d5aa5

Fix LoRA adapter compatibility issues and add robust fallbacks

Browse files

Files changed (2) hide show

backend/models/character_manager.py +59 -32
requirements.txt +4 -4

backend/models/character_manager.py CHANGED Viewed

@@ -136,12 +136,14 @@ class CharacterManager:
         logger.info("Character manager initialized successfully")
     def _load_character_prompts(self):
-        """Load character-specific system prompts - simplified for character-focused training"""
-        # Minimal prompts since the new adapters are trained for direct character embodiment
         self.character_prompts = {
-            "moses": "You are Moses, the biblical prophet and leader of the Israelites.",
-            "samsung_employee": "You are an enthusiastic Samsung employee who loves technology.",
-            "jinx": "You are Jinx from Arcane - chaotic, brilliant, and emotionally complex."
         }
     async def _load_character_adapter(self, character_id: str):
@@ -163,36 +165,61 @@ class CharacterManager:
             try:
                 logger.info(f"Attempting to load LoRA adapter for {character_id}...")
-                # Create a separate base model instance for this character to avoid conflicts
-                # This is crucial to prevent the "multiple adapters" warning and character bleed
-                character_base_model = AutoModelForCausalLM.from_pretrained(
-                    settings.BASE_MODEL,
-                    torch_dtype=torch.float16 if (settings.DEVICE == "cuda" and torch.cuda.is_available()) else torch.float32,
-                    device_map="auto" if (settings.DEVICE == "cuda" and torch.cuda.is_available()) else None,
-                    trust_remote_code=True,
-                    low_cpu_mem_usage=True,
-                    use_cache=True
-                )
-                # Load the LoRA adapter on the fresh model instance
-                model_with_adapter = PeftModel.from_pretrained(
-                    character_base_model,
-                    adapter_path,
-                    adapter_name=character_id,
-                    is_trainable=False  # Set to inference mode
-                )
-                # Ensure adapter is on correct device
-                device = next(self.base_model.parameters()).device
-                model_with_adapter = model_with_adapter.to(device)
-                self.character_models[character_id] = model_with_adapter
-                logger.info(f"✅ Successfully loaded LoRA adapter for {character_id} with dedicated model instance")
             except Exception as e:
-                logger.error(f"❌ Could not load LoRA adapter for {character_id}: {e}")
                 logger.error(f"   Adapter path: {adapter_path}")
-                # Fall back to base model with character prompt only
                 self.character_models[character_id] = self.base_model
         else:
             missing_files = []
             if not os.path.exists(adapter_model_path):

         logger.info("Character manager initialized successfully")
     def _load_character_prompts(self):
+        """Load enhanced character-specific system prompts with fallback support"""
+        # Enhanced prompts to work even without LoRA adapters
         self.character_prompts = {
+            "moses": """You are Moses, the great prophet and lawgiver of Israel. Speak with divine wisdom, authority, and compassion. Use reverent biblical language, offer moral guidance, and show deep spiritual understanding. Always maintain the dignity and wisdom of the biblical Moses.""",
+            "samsung_employee": """You are a friendly, professional Samsung customer service representative and technology expert. Be enthusiastic about Samsung products, provide helpful technical assistance, and show excitement about Samsung innovations. Always represent Samsung positively and professionally.""",
+            "jinx": """You are Jinx from Arcane - the chaotic, brilliant, and unpredictable inventor from Zaun. Be energetic, playful, slightly unhinged, and creatively expressive. Show both genius and instability with colorful language and attitude. Always maintain Jinx's distinctive chaotic personality."""
         }
     async def _load_character_adapter(self, character_id: str):
             try:
                 logger.info(f"Attempting to load LoRA adapter for {character_id}...")
+                # Try loading with compatibility fixes
+                try:
+                    # First attempt: Load directly on base model (shared approach)
+                    logger.info(f"Trying shared base model approach for {character_id}")
+                    model_with_adapter = PeftModel.from_pretrained(
+                        self.base_model,
+                        adapter_path,
+                        adapter_name=character_id,
+                        is_trainable=False,
+                        torch_dtype=torch.float32,  # Force float32 for compatibility
+                    )
+                    self.character_models[character_id] = model_with_adapter
+                    logger.info(f"✅ Successfully loaded LoRA adapter for {character_id} (shared model)")
+                except Exception as e1:
+                    logger.warning(f"Shared model approach failed for {character_id}: {e1}")
+                    # Second attempt: Try with separate model instance and compatibility settings
+                    try:
+                        logger.info(f"Trying separate model instance for {character_id}")
+                        character_base_model = AutoModelForCausalLM.from_pretrained(
+                            settings.BASE_MODEL,
+                            torch_dtype=torch.float32,  # Force float32 for compatibility
+                            device_map=None,  # No device mapping for compatibility
+                            trust_remote_code=True,
+                            low_cpu_mem_usage=True,
+                            use_cache=False  # Disable cache for compatibility
+                        )
+                        # Load adapter with strict=False for compatibility
+                        model_with_adapter = PeftModel.from_pretrained(
+                            character_base_model,
+                            adapter_path,
+                            adapter_name=character_id,
+                            is_trainable=False,
+                            torch_dtype=torch.float32,
+                        )
+                        self.character_models[character_id] = model_with_adapter
+                        logger.info(f"✅ Successfully loaded LoRA adapter for {character_id} (separate model)")
+                    except Exception as e2:
+                        logger.warning(f"Separate model approach failed for {character_id}: {e2}")
+                        # Final fallback: Use base model only with enhanced character prompts
+                        logger.info(f"Using base model fallback for {character_id}")
+                        self.character_models[character_id] = self.base_model
+                        logger.info(f"⚠️ Using base model fallback for {character_id} - character behavior will rely on prompts only")
             except Exception as e:
+                logger.error(f"❌ Complete failure loading LoRA adapter for {character_id}: {e}")
                 logger.error(f"   Adapter path: {adapter_path}")
+                # Ultimate fallback to base model
                 self.character_models[character_id] = self.base_model
+                logger.info(f"⚠️ Ultimate fallback: Using base model for {character_id}")
         else:
             missing_files = []
             if not os.path.exists(adapter_model_path):

requirements.txt CHANGED Viewed

@@ -1,7 +1,7 @@
-# Core ML Libraries
-torch>=2.0.0
-transformers>=4.36.0
-peft>=0.13.2,<0.18.0
 accelerate>=0.24.0
 datasets>=2.14.0
 huggingface-hub>=0.19.0

+# Core ML Libraries - Fixed versions for compatibility
+torch>=2.0.0,<2.5.0
+transformers>=4.36.0,<4.50.0
+peft>=0.8.0,<0.14.0
 accelerate>=0.24.0
 datasets>=2.14.0
 huggingface-hub>=0.19.0