jree423
/

svgdreamer

@@ -14,27 +14,33 @@ import torchvision.transforms as transforms
 import random
 import math
-class SVGDreamerHandler:
-    def __init__(self):
         self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         self.model_id = "runwayml/stable-diffusion-v1-5"
-        # Initialize the diffusion pipeline
-        self.pipe = StableDiffusionPipeline.from_pretrained(
-            self.model_id,
-            torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32,
-            safety_checker=None,
-            requires_safety_checker=False
-        ).to(self.device)
-        # Use DDIM scheduler for better control
-        self.pipe.scheduler = DDIMScheduler.from_config(self.pipe.scheduler.config)
-        # CLIP model for guidance
-        self.clip_model = self.pipe.text_encoder
-        self.clip_tokenizer = self.pipe.tokenizer
-        print("SVGDreamer handler initialized successfully!")
     def __call__(self, inputs: Union[str, Dict[str, Any]]) -> Image.Image:
         """
@@ -491,18 +497,26 @@ class SVGDreamerHandler:
     def get_text_embeddings(self, prompt: str):
         """Get CLIP text embeddings for the prompt"""
-        with torch.no_grad():
-            text_inputs = self.clip_tokenizer(
-                prompt,
-                padding="max_length",
-                max_length=self.clip_tokenizer.model_max_length,
-                truncation=True,
-                return_tensors="pt"
-            ).to(self.device)
-            text_embeddings = self.clip_model(text_inputs.input_ids)[0]
-        return text_embeddings
     def extract_semantic_features(self, prompt: str):
         """Extract semantic features from prompt"""

 import random
 import math
+class EndpointHandler:
+    def __init__(self, path=""):
+        """Load the Stable Diffusion pipeline and expose its text encoder.
+
+        Args:
+            path: Accepted but not read anywhere in this method.
+
+        Loading is best-effort: if any step raises, a warning is printed and
+        ``pipe``, ``clip_model`` and ``clip_tokenizer`` are all set to None
+        instead of propagating the error.
+        """
         self.device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
         self.model_id = "runwayml/stable-diffusion-v1-5"
+        try:
+            # Half precision only when CUDA is available, full precision otherwise.
+            weights_dtype = torch.float32
+            if torch.cuda.is_available():
+                weights_dtype = torch.float16
+            loaded = StableDiffusionPipeline.from_pretrained(
+                self.model_id,
+                torch_dtype=weights_dtype,
+                safety_checker=None,
+                requires_safety_checker=False,
+            )
+            self.pipe = loaded.to(self.device)
+            # Swap in a DDIM scheduler built from the pipeline's own scheduler config.
+            ddim = DDIMScheduler.from_config(self.pipe.scheduler.config)
+            self.pipe.scheduler = ddim
+            # Keep direct handles on the pipeline's text encoder and tokenizer.
+            self.clip_model = self.pipe.text_encoder
+            self.clip_tokenizer = self.pipe.tokenizer
+            print("SVGDreamer handler initialized successfully!")
+        except Exception as e:
+            print(f"Warning: Could not load diffusion model: {e}")
+            # Mark every model handle as unavailable (assigned left to right).
+            self.pipe = self.clip_model = self.clip_tokenizer = None
     def __call__(self, inputs: Union[str, Dict[str, Any]]) -> Image.Image:
         """
     def get_text_embeddings(self, prompt: str):
         """Get CLIP text embeddings for the prompt"""
+        # Args:
+        #     prompt: text passed to the tokenizer, padded/truncated to the
+        #         tokenizer's model_max_length.
+        # Returns:
+        #     The first output of the text encoder for the tokenized prompt.
+        #     When the encoder or tokenizer is missing, or encoding raises, an
+        #     all-zero (1, 77, 768) placeholder is returned instead and the
+        #     error is printed.
+        if self.clip_model is not None and self.clip_tokenizer is not None:
+            try:
+                with torch.no_grad():
+                    text_inputs = self.clip_tokenizer(
+                        prompt,
+                        padding="max_length",
+                        max_length=self.clip_tokenizer.model_max_length,
+                        truncation=True,
+                        return_tensors="pt"
+                    ).to(self.device)
+                    text_embeddings = self.clip_model(text_inputs.input_ids)[0]
+                return text_embeddings
+            except Exception as e:
+                print(f"Error getting text embeddings: {e}")
+        # Single fallback exit. The placeholder is created on self.device with
+        # the same float16-on-CUDA / float32-otherwise rule used when the
+        # pipeline is loaded, so it can stand in for a real embedding without a
+        # device or dtype mismatch.
+        # NOTE(review): (1, 77, 768) presumably matches this text encoder's
+        # sequence length and hidden size - confirm against the loaded model.
+        placeholder_dtype = torch.float16 if self.device.type == "cuda" else torch.float32
+        return torch.zeros((1, 77, 768), dtype=placeholder_dtype, device=self.device)
     def extract_semantic_features(self, prompt: str):
         """Extract semantic features from prompt"""