jree423
/

diffsketchedit

@@ -1,81 +1,74 @@
-import os
-import sys
 import torch
-import base64
-import json
 import numpy as np
 import svgwrite
 import random
 import math
-from diffusers import StableDiffusionPipeline
-from transformers import CLIPTextModel, CLIPTokenizer
-from typing import List, Dict, Any, Tuple
-import io
-from PIL import Image
-class EndpointHandler:
-    def __init__(self, path=""):
-        """Initialize DiffSketchEdit handler for Hugging Face Inference API"""
-        self.device = "cuda" if torch.cuda.is_available() else "cpu"
-        print(f"Using device: {self.device}")
-        # Initialize Stable Diffusion pipeline
-        try:
-            self.pipe = StableDiffusionPipeline.from_pretrained(
-                "runwayml/stable-diffusion-v1-5",
-                torch_dtype=torch.float16 if self.device == "cuda" else torch.float32,
-                safety_checker=None,
-                requires_safety_checker=False
-            )
-            self.pipe = self.pipe.to(self.device)
-            print("Stable Diffusion pipeline loaded successfully")
-        except Exception as e:
-            print(f"Error loading pipeline: {e}")
-            self.pipe = None
-        # Initialize tokenizer and text encoder
-        try:
-            self.tokenizer = CLIPTokenizer.from_pretrained("openai/clip-vit-base-patch32")
-            self.text_encoder = CLIPTextModel.from_pretrained("openai/clip-vit-base-patch32")
-            self.text_encoder = self.text_encoder.to(self.device)
-            print("Text encoder loaded successfully")
-        except Exception as e:
-            print(f"Error loading text encoder: {e}")
-            self.tokenizer = None
-            self.text_encoder = None
-    def __call__(self, data):
-        """Edit vector sketches based on text prompts"""
         try:
-            # Extract inputs
-            inputs = data.get("inputs", "")
-            parameters = data.get("parameters", {})
-            # Handle different input formats
-            if isinstance(inputs, dict):
-                prompts = inputs.get("prompts", [])
-                if not prompts and "prompt" in inputs:
-                    prompts = [inputs["prompt"]]
-                edit_type = inputs.get("edit_type", "refine")
-                input_svg = inputs.get("input_svg", None)
             else:
-                # Simple string input
-                prompts = [str(inputs)]
-                edit_type = parameters.get("edit_type", "refine")
-                input_svg = parameters.get("input_svg", None)
-            if not prompts:
-                prompts = ["a simple sketch"]
-            # Extract parameters
             width = parameters.get("width", 224)
             height = parameters.get("height", 224)
-            seed = parameters.get("seed", 42)
-            # Set seed for reproducibility
-            torch.manual_seed(seed)
-            np.random.seed(seed)
-            random.seed(seed)
             print(f"Processing edit type: '{edit_type}' with prompts: {prompts}")
@@ -96,6 +89,7 @@ class EndpointHandler:
             pil_image = self.svg_to_pil_image(svg_content, width, height)
             # Store metadata
             for key, value in metadata.items():
                 if isinstance(value, (dict, list)):
                     pil_image.info[key] = json.dumps(value)
@@ -118,16 +112,11 @@ class EndpointHandler:
         try:
             print(f"Word replacement: '{source_prompt}' -> '{target_prompt}'")
-            # Analyze the difference between prompts
-            source_words = set(source_prompt.lower().split())
-            target_words = set(target_prompt.lower().split())
-            added_words = target_words - source_words
-            removed_words = source_words - target_words
             print(f"Added words: {added_words}, Removed words: {removed_words}")
-            # Generate base SVG from source prompt
             if input_svg:
                 base_svg = input_svg
             else:
@@ -184,8 +173,9 @@ class EndpointHandler:
         try:
             print(f"Attention reweighting for: '{prompt}'")
-            # Parse attention weights from prompt (e.g., "(cat:1.5)" or "[dog:0.8]")
             weighted_prompt, attention_weights = self.parse_attention_weights(prompt)
             # Generate or use base SVG
             if input_svg:
@@ -236,518 +226,469 @@ class EndpointHandler:
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
-        # Analyze prompt to determine content
-        prompt_lower = prompt.lower()
-        if any(word in prompt_lower for word in ['house', 'building', 'home']):
-            self._add_house_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['tree', 'forest', 'nature']):
-            self._add_tree_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['car', 'vehicle', 'transport']):
-            self._add_car_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['face', 'person', 'portrait']):
-            self._add_face_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['flower', 'plant', 'garden']):
-            self._add_flower_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['cat', 'dog', 'animal']):
-            self._add_animal_elements(dwg, width, height, prompt_lower)
         else:
-            self._add_abstract_elements(dwg, width, height, prompt)
         return dwg.tostring()
-    def apply_word_replacement(self, base_svg: str, source_prompt: str, target_prompt: str, added_words: set, removed_words: set, width: int, height: int):
         """Apply word replacement transformations to SVG"""
-        # Parse the base SVG and modify based on word changes
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
-        # Analyze what needs to change
-        for word in added_words:
-            if word in ['red', 'blue', 'green', 'yellow', 'purple']:
-                self._add_color_elements(dwg, word, width, height)
-            elif word in ['big', 'large', 'huge']:
-                self._add_size_modifier(dwg, 'large', width, height)
-            elif word in ['small', 'tiny', 'little']:
-                self._add_size_modifier(dwg, 'small', width, height)
-            elif word in ['cat', 'dog', 'bird']:
-                self._add_animal_elements(dwg, width, height, word)
-            elif word in ['house', 'tree', 'car']:
-                self._add_object_elements(dwg, word, width, height)
-        # Apply transformations based on target prompt
-        target_lower = target_prompt.lower()
-        if any(word in target_lower for word in ['house', 'building']):
-            self._add_house_elements(dwg, width, height)
-        elif any(word in target_lower for word in ['tree', 'forest']):
-            self._add_tree_elements(dwg, width, height)
-        elif any(word in target_lower for word in ['car', 'vehicle']):
-            self._add_car_elements(dwg, width, height)
         return dwg.tostring()
     def apply_refinement(self, base_svg: str, prompt: str, width: int, height: int):
         """Apply refinement to existing SVG"""
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
-        prompt_lower = prompt.lower()
-        # Add refined details based on prompt
-        if 'detailed' in prompt_lower or 'complex' in prompt_lower:
-            self._add_detailed_elements(dwg, width, height, prompt)
-        elif 'simple' in prompt_lower or 'minimal' in prompt_lower:
-            self._add_simple_elements(dwg, width, height, prompt)
         else:
-            # Default refinement
-            self._add_standard_elements(dwg, width, height, prompt)
         return dwg.tostring()
     def apply_attention_reweighting(self, base_svg: str, prompt: str, attention_weights: dict, width: int, height: int):
-        """Apply attention reweighting to SVG elements"""
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
-        # Apply weighted emphasis to different elements
         for word, weight in attention_weights.items():
             if weight > 1.0:
                 # Emphasize this element
-                self._emphasize_element(dwg, word, weight, width, height)
             elif weight < 1.0:
                 # De-emphasize this element
-                self._deemphasize_element(dwg, word, weight, width, height)
-        # Add base elements
-        self._add_standard_elements(dwg, width, height, prompt)
         return dwg.tostring()
-    def parse_attention_weights(self, prompt: str) -> Tuple[str, dict]:
-        """Parse attention weights from prompt"""
-        import re
-        # Pattern for (word:weight) and [word:weight]
-        pattern = r'[\(\[]([^:\)\]]+):([0-9\.]+)[\)\]]'
-        matches = re.findall(pattern, prompt)
-        attention_weights = {}
-        clean_prompt = prompt
-        for word, weight_str in matches:
-            try:
-                weight = float(weight_str)
-                attention_weights[word.strip()] = weight
-                # Remove the weight notation from prompt
-                clean_prompt = re.sub(rf'[\(\[]{re.escape(word)}:{re.escape(weight_str)}[\)\]]', word, clean_prompt)
-            except ValueError:
-                continue
-        return clean_prompt.strip(), attention_weights
-    def _add_house_elements(self, dwg, width, height):
-        """Add house elements to SVG"""
-        house_width = width * 0.6
-        house_height = height * 0.4
-        house_x = (width - house_width) / 2
-        house_y = height * 0.4
-        # House base
         dwg.add(dwg.rect(
-            insert=(house_x, house_y),
-            size=(house_width, house_height),
-            fill='none',
             stroke='black',
             stroke_width=2
         ))
         # Roof
-        roof_points = [
-            (house_x, house_y),
-            (house_x + house_width/2, house_y - house_height*0.3),
-            (house_x + house_width, house_y)
-        ]
-        dwg.add(dwg.polygon(roof_points, fill='none', stroke='black', stroke_width=2))
         # Door
-        door_width = house_width * 0.2
-        door_height = house_height * 0.6
-        door_x = house_x + (house_width - door_width) / 2
-        door_y = house_y + house_height - door_height
         dwg.add(dwg.rect(
             insert=(door_x, door_y),
             size=(door_width, door_height),
-            fill='none',
             stroke='black',
             stroke_width=2
         ))
-    def _add_tree_elements(self, dwg, width, height):
-        """Add tree elements to SVG"""
-        center_x = width / 2
-        center_y = height / 2
         # Trunk
-        trunk_width = 12
-        trunk_height = height * 0.3
         dwg.add(dwg.rect(
-            insert=(center_x - trunk_width/2, center_y + 20),
             size=(trunk_width, trunk_height),
-            fill='none',
             stroke='black',
-            stroke_width=2
         ))
-        # Crown
-        crown_radius = width * 0.25
-        dwg.add(dwg.circle(
-            center=(center_x, center_y),
-            r=crown_radius,
-            fill='none',
-            stroke='black',
-            stroke_width=2
-        ))
-    def _add_car_elements(self, dwg, width, height):
-        """Add car elements to SVG"""
-        car_width = width * 0.7
-        car_height = height * 0.3
-        car_x = (width - car_width) / 2
-        car_y = (height - car_height) / 2
         # Car body
         dwg.add(dwg.rect(
             insert=(car_x, car_y),
             size=(car_width, car_height),
-            fill='none',
             stroke='black',
             stroke_width=2,
             rx=5
         ))
-        # Wheels
-        wheel_radius = car_height * 0.4
-        wheel_y = car_y + car_height - wheel_radius/2
-        dwg.add(dwg.circle(
-            center=(car_x + car_width * 0.2, wheel_y),
-            r=wheel_radius,
-            fill='none',
-            stroke='black',
-            stroke_width=2
-        ))
-        dwg.add(dwg.circle(
-            center=(car_x + car_width * 0.8, wheel_y),
-            r=wheel_radius,
-            fill='none',
-            stroke='black',
-            stroke_width=2
-        ))
-    def _add_face_elements(self, dwg, width, height):
-        """Add face elements to SVG"""
-        center_x = width / 2
-        center_y = height / 2
-        face_radius = min(width, height) * 0.3
-        # Face outline
-        dwg.add(dwg.circle(
-            center=(center_x, center_y),
-            r=face_radius,
-            fill='none',
             stroke='black',
-            stroke_width=2
-        ))
-        # Eyes
-        eye_offset = face_radius * 0.3
-        eye_radius = face_radius * 0.1
-        dwg.add(dwg.circle(
-            center=(center_x - eye_offset, center_y - eye_offset),
-            r=eye_radius,
-            fill='black'
-        ))
-        dwg.add(dwg.circle(
-            center=(center_x + eye_offset, center_y - eye_offset),
-            r=eye_radius,
-            fill='black'
         ))
-        # Mouth
-        mouth_y = center_y + face_radius * 0.3
-        dwg.add(dwg.path(
-            d=f"M {center_x - face_radius*0.3},{mouth_y} Q {center_x},{mouth_y + face_radius*0.2} {center_x + face_radius*0.3},{mouth_y}",
-            fill='none',
-            stroke='black',
-            stroke_width=2
-        ))
-    def _add_flower_elements(self, dwg, width, height):
-        """Add flower elements to SVG"""
-        center_x = width / 2
-        center_y = height / 2
-        # Stem
-        dwg.add(dwg.line(
-            start=(center_x, center_y + 20),
-            end=(center_x, height - 20),
-            stroke='green',
-            stroke_width=4
-        ))
-        # Petals
-        petal_radius = 15
-        for angle in range(0, 360, 45):
-            x = center_x + 25 * math.cos(math.radians(angle))
-            y = center_y + 25 * math.sin(math.radians(angle))
-            dwg.add(dwg.circle(
-                center=(x, y),
-                r=petal_radius,
-                fill='none',
-                stroke='red',
-                stroke_width=2
-            ))
-        # Center
-        dwg.add(dwg.circle(
-            center=(center_x, center_y),
-            r=8,
-            fill='yellow',
-            stroke='orange',
-            stroke_width=2
-        ))
-    def _add_animal_elements(self, dwg, width, height, animal_type):
-        """Add animal elements to SVG"""
-        center_x = width / 2
-        center_y = height / 2
-        if 'cat' in animal_type:
-            # Cat body
-            dwg.add(dwg.ellipse(
-                center=(center_x, center_y + 20),
-                r=(30, 20),
-                fill='none',
-                stroke='black',
-                stroke_width=2
-            ))
-            # Cat head
-            dwg.add(dwg.circle(
-                center=(center_x, center_y - 20),
-                r=25,
-                fill='none',
-                stroke='black',
-                stroke_width=2
-            ))
-            # Cat ears
-            ear_points1 = [(center_x - 15, center_y - 35), (center_x - 5, center_y - 50), (center_x + 5, center_y - 35)]
-            ear_points2 = [(center_x - 5, center_y - 35), (center_x + 5, center_y - 50), (center_x + 15, center_y - 35)]
-            dwg.add(dwg.polygon(ear_points1, fill='none', stroke='black', stroke_width=2))
-            dwg.add(dwg.polygon(ear_points2, fill='none', stroke='black', stroke_width=2))
-        elif 'dog' in animal_type:
-            # Dog body
-            dwg.add(dwg.ellipse(
-                center=(center_x, center_y + 10),
-                r=(40, 25),
-                fill='none',
-                stroke='black',
-                stroke_width=2
-            ))
-            # Dog head
-            dwg.add(dwg.ellipse(
-                center=(center_x, center_y - 25),
-                r=(25, 20),
-                fill='none',
-                stroke='black',
-                stroke_width=2
-            ))
-    def _add_color_elements(self, dwg, color, width, height):
-        """Add color-specific elements"""
         color_map = {
             'red': '#FF0000',
             'blue': '#0000FF',
             'green': '#00FF00',
             'yellow': '#FFFF00',
-            'purple': '#800080'
         }
-        fill_color = color_map.get(color, '#000000')
-        # Add a colored accent element
         dwg.add(dwg.circle(
-            center=(width * 0.8, height * 0.2),
-            r=15,
-            fill=fill_color,
             stroke='black',
-            stroke_width=1
         ))
-    def _add_size_modifier(self, dwg, size_type, width, height):
-        """Add size modification indicators"""
-        if size_type == 'large':
-            # Add larger elements
-            dwg.add(dwg.rect(
-                insert=(10, 10),
-                size=(width-20, height-20),
-                fill='none',
-                stroke='gray',
-                stroke_width=3,
-                stroke_dasharray='5,5'
-            ))
-        elif size_type == 'small':
-            # Add smaller elements
-            dwg.add(dwg.rect(
-                insert=(width*0.3, height*0.3),
-                size=(width*0.4, height*0.4),
-                fill='none',
-                stroke='gray',
-                stroke_width=1,
-                stroke_dasharray='2,2'
             ))
-    def _add_object_elements(self, dwg, obj_type, width, height):
-        """Add specific object elements"""
-        if obj_type == 'house':
-            self._add_house_elements(dwg, width, height)
-        elif obj_type == 'tree':
-            self._add_tree_elements(dwg, width, height)
-        elif obj_type == 'car':
-            self._add_car_elements(dwg, width, height)
-    def _add_detailed_elements(self, dwg, width, height, prompt):
-        """Add detailed elements for complex prompts"""
-        # Add multiple overlapping shapes for complexity
-        for i in range(8):
-            x = random.randint(20, width-40)
-            y = random.randint(20, height-40)
-            size = random.randint(10, 30)
-            shape_type = random.choice(['circle', 'rect', 'polygon'])
-            if shape_type == 'circle':
-                dwg.add(dwg.circle(
-                    center=(x, y),
-                    r=size,
-                    fill='none',
-                    stroke='black',
-                    stroke_width=1,
-                    opacity=0.7
-                ))
-            elif shape_type == 'rect':
-                dwg.add(dwg.rect(
-                    insert=(x-size, y-size),
-                    size=(size*2, size*2),
-                    fill='none',
-                    stroke='black',
-                    stroke_width=1,
-                    opacity=0.7
-                ))
-    def _add_simple_elements(self, dwg, width, height, prompt):
-        """Add simple elements for minimal prompts"""
-        # Add just a few basic shapes
-        center_x = width / 2
-        center_y = height / 2
         dwg.add(dwg.circle(
-            center=(center_x, center_y),
-            r=min(width, height) * 0.2,
-            fill='none',
             stroke='black',
             stroke_width=2
         ))
-    def _add_standard_elements(self, dwg, width, height, prompt):
-        """Add standard elements based on prompt"""
-        prompt_lower = prompt.lower()
-        if any(word in prompt_lower for word in ['house', 'building']):
-            self._add_house_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['tree', 'forest']):
-            self._add_tree_elements(dwg, width, height)
-        elif any(word in prompt_lower for word in ['car', 'vehicle']):
-            self._add_car_elements(dwg, width, height)
-        else:
-            self._add_abstract_elements(dwg, width, height, prompt)
-    def _add_abstract_elements(self, dwg, width, height, prompt):
-        """Add abstract elements based on prompt"""
-        prompt_hash = hash(prompt) % 100
-        for i in range(5):
-            x = (i * 40 + prompt_hash) % (width - 40) + 20
-            y = (i * 35 + prompt_hash) % (height - 40) + 20
-            size = 15 + (i * 5) % 20
-            dwg.add(dwg.circle(
-                center=(x, y),
-                r=size,
-                fill='none',
-                stroke='black',
-                stroke_width=2,
-                opacity=0.8
-            ))
-    def _emphasize_element(self, dwg, word, weight, width, height):
-        """Emphasize an element based on attention weight"""
-        # Make elements larger and more prominent
-        scale_factor = weight
-        stroke_width = int(2 * scale_factor)
-        if word in ['house', 'building']:
-            # Emphasized house
-            house_size = min(width, height) * 0.4 * scale_factor
-            house_x = (width - house_size) / 2
-            house_y = (height - house_size) / 2
-            dwg.add(dwg.rect(
-                insert=(house_x, house_y),
-                size=(house_size, house_size * 0.8),
-                fill='none',
-                stroke='red',
-                stroke_width=stroke_width
-            ))
-    def _deemphasize_element(self, dwg, word, weight, width, height):
-        """De-emphasize an element based on attention weight"""
-        # Make elements smaller and less prominent
-        scale_factor = weight
-        stroke_width = max(1, int(2 * scale_factor))
-        if word in ['background', 'sky']:
-            # De-emphasized background elements
-            dwg.add(dwg.rect(
-                insert=(0, 0),
-                size=(width, height * 0.3),
-                fill='none',
-                stroke='lightgray',
-                stroke_width=stroke_width,
-                opacity=scale_factor
-            ))
-    def create_error_result(self, prompt: str, edit_type: str, error: str, width: int, height: int):
-        """Create error result with fallback SVG"""
-        fallback_svg = self.create_fallback_svg(prompt, width, height)
-        return {
-            "svg": fallback_svg,
-            "svg_base64": base64.b64encode(fallback_svg.encode('utf-8')).decode('utf-8'),
-            "edit_type": edit_type,
-            "prompt": prompt,
-            "error": error
         }
-    def svg_to_pil_image(self, svg_content, width, height):
         """Convert SVG content to PIL Image"""
         try:
             import cairosvg
-            import io
             # Convert SVG to PNG bytes
             png_bytes = cairosvg.svg2png(
@@ -778,10 +719,10 @@ class EndpointHandler:
         # Simple centered text
         dwg.add(dwg.text(
-            f"DiffSketchEdit\n{prompt[:20]}...",
             insert=(width/2, height/2),
             text_anchor="middle",
-            font_size="14",
             fill="black"
         ))

 import torch
+import torch.nn.functional as F
 import numpy as np
+import json
+import base64
+import io
+from PIL import Image
 import svgwrite
+from typing import Dict, Any, List, Optional, Union
+import diffusers
+from diffusers import StableDiffusionPipeline, DDIMScheduler
+from transformers import CLIPTextModel, CLIPTokenizer
+import torchvision.transforms as transforms
 import random
 import math
+import re
+class DiffSketchEditHandler:
+    def __init__(self):
+        """Load the Stable Diffusion pipeline and keep handles to its text encoder.
+        The pipeline is loaded in float16 and moved to CUDA when a GPU is
+        available; otherwise it is loaded in float32 on the CPU. The safety
+        checker is disabled and the scheduler is swapped for DDIM.
+        """
+        cuda_available = torch.cuda.is_available()
+        self.device = torch.device("cuda" if cuda_available else "cpu")
+        self.model_id = "runwayml/stable-diffusion-v1-5"
+        # float16 weights on the GPU, float32 on the CPU
+        weights_dtype = torch.float16 if cuda_available else torch.float32
+        pipeline = StableDiffusionPipeline.from_pretrained(
+            self.model_id,
+            torch_dtype=weights_dtype,
+            safety_checker=None,
+            requires_safety_checker=False
+        )
+        self.pipe = pipeline.to(self.device)
+        # Rebuild the scheduler as DDIM from the pipeline's existing scheduler config
+        self.pipe.scheduler = DDIMScheduler.from_config(self.pipe.scheduler.config)
+        # Aliases for the pipeline's own text encoder and tokenizer
+        self.clip_model = self.pipe.text_encoder
+        self.clip_tokenizer = self.pipe.tokenizer
+        print("DiffSketchEdit handler initialized successfully!")
+    def __call__(self, inputs: Union[str, Dict[str, Any]]) -> Image.Image:
+        """
+        Perform sketch editing using DiffSketchEdit approach
+        """
         try:
+            # Parse inputs
+            if isinstance(inputs, str):
+                # Simple prompt - treat as generation
+                prompts = [inputs]
+                edit_type = "generate"
+                parameters = {}
             else:
+                input_data = inputs.get("inputs", inputs)
+                if isinstance(input_data, str):
+                    prompts = [input_data]
+                    edit_type = "generate"
+                else:
+                    prompts = input_data.get("prompts", [input_data.get("prompt", "a simple sketch")])
+                    edit_type = input_data.get("edit_type", "generate")
+                parameters = inputs.get("parameters", {})
+            # Extract parameters with defaults
             width = parameters.get("width", 224)
             height = parameters.get("height", 224)
+            seed = parameters.get("seed", None)
+            input_svg = parameters.get("input_svg", None)
+            if seed is not None:
+                torch.manual_seed(seed)
+                np.random.seed(seed)
+                random.seed(seed)
             print(f"Processing edit type: '{edit_type}' with prompts: {prompts}")
             pil_image = self.svg_to_pil_image(svg_content, width, height)
             # Store metadata
+            pil_image.info['svg_content'] = svg_content
             for key, value in metadata.items():
                 if isinstance(value, (dict, list)):
                     pil_image.info[key] = json.dumps(value)
         try:
             print(f"Word replacement: '{source_prompt}' -> '{target_prompt}'")
+            # Analyze word differences
+            added_words, removed_words = self.analyze_word_differences(source_prompt, target_prompt)
             print(f"Added words: {added_words}, Removed words: {removed_words}")
+            # Generate or use base SVG
             if input_svg:
                 base_svg = input_svg
             else:
         try:
             print(f"Attention reweighting for: '{prompt}'")
+            # Parse attention weights from prompt (e.g., "(cat:1.5)" or "[table:0.5]")
             weighted_prompt, attention_weights = self.parse_attention_weights(prompt)
+            print(f"Weighted prompt: '{weighted_prompt}', weights: {attention_weights}")
             # Generate or use base SVG
             if input_svg:
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
+        # Extract semantic features
+        features = self.extract_semantic_features(prompt)
+        # Generate content based on prompt
+        if any(word in prompt.lower() for word in ['person', 'people', 'human', 'man', 'woman']):
+            self.add_person_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['animal', 'cat', 'dog', 'bird', 'horse']):
+            self.add_animal_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['house', 'building', 'architecture']):
+            self.add_building_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['tree', 'nature', 'landscape']):
+            self.add_nature_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['car', 'vehicle', 'transport']):
+            self.add_vehicle_elements(dwg, width, height, features)
         else:
+            self.add_abstract_elements(dwg, width, height, features)
         return dwg.tostring()
+    def analyze_word_differences(self, source: str, target: str):
+        """Return the words gained and lost when going from ``source`` to ``target``.
+        Both prompts are lower-cased and split on whitespace into sets, so
+        word order and repetition are ignored. The result is the tuple
+        ``(added_words, removed_words)``.
+        """
+        before, after = ({*text.lower().split()} for text in (source, target))
+        return after.difference(before), before.difference(after)
+    def parse_attention_weights(self, prompt: str):
+        """Extract ``(word:weight)`` / ``[word:weight]`` annotations from a prompt.
+        Returns ``(weighted_prompt, attention_weights)``: the prompt with each
+        recognised annotation replaced by its bare word (then stripped), and a
+        dict mapping each word to its float weight. Parenthesised annotations
+        are processed before bracketed ones, so a word that appears in both
+        forms ends up with the bracketed weight.
+        Annotations whose weight is not a plain decimal number (for example
+        ``(cat:1.2.3)``) are left in the prompt untouched instead of raising
+        ``ValueError``.
+        """
+        # The word may not contain bracket characters; otherwise a match could
+        # start at an earlier, unrelated "(" or "[" and swallow text up to the
+        # real annotation.
+        word_group = r'([^:()\[\]]+)'
+        # A single decimal number, so float() below cannot fail.
+        weight_group = r'(\d+(?:\.\d*)?|\.\d+)'
+        annotation_patterns = (
+            rf'\({word_group}:{weight_group}\)',  # (word:weight)
+            rf'\[{word_group}:{weight_group}\]',  # [word:weight]
+        )
+        attention_weights = {}
+        weighted_prompt = prompt
+        for pattern in annotation_patterns:
+            for match in re.finditer(pattern, prompt):
+                word = match.group(1).strip()
+                attention_weights[word] = float(match.group(2))
+                # Remove the weight notation from prompt
+                weighted_prompt = weighted_prompt.replace(match.group(0), word)
+        return weighted_prompt.strip(), attention_weights
+    def apply_word_replacement(self, base_svg: str, source_prompt: str, target_prompt: str,
+                             added_words: set, removed_words: set, width: int, height: int):
         """Apply word replacement transformations to SVG"""
+        # Builds a fresh width x height drawing on a white background and returns
+        # it serialized with dwg.tostring(). Exactly one branch below adds content,
+        # checked in this order: a colour word was added, a "large" word was added,
+        # a "small" word was added, otherwise content derived from target_prompt.
+        # NOTE(review): base_svg, source_prompt and removed_words are accepted but
+        # never read here, so nothing from the base sketch is carried over.
+        # Features come from the target prompt; only the two size branches use them
+        features = self.extract_semantic_features(target_prompt)
+        # Start from an empty canvas with a white background rectangle
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
+        # Apply changes based on word differences (first matching category wins)
+        if any(word in added_words for word in ['red', 'blue', 'green', 'yellow']):
+            # Color change
+            self.add_colored_elements(dwg, width, height, added_words)
+        elif any(word in added_words for word in ['big', 'large', 'huge']):
+            # Size change
+            self.add_large_elements(dwg, width, height, features)
+        elif any(word in added_words for word in ['small', 'tiny', 'mini']):
+            # Size change
+            self.add_small_elements(dwg, width, height, features)
+        else:
+            # General content change
+            self.add_content_based_on_prompt(dwg, target_prompt, width, height)
         return dwg.tostring()
     def apply_refinement(self, base_svg: str, prompt: str, width: int, height: int):
         """Apply refinement to existing SVG"""
+        # Draws a new width x height sketch for `prompt` on a white background and
+        # returns it serialized with dwg.tostring().
+        # NOTE(review): base_svg is not read in this method; the result is built
+        # from the prompt alone.
+        features = self.extract_semantic_features(prompt)
         dwg = svgwrite.Drawing(size=(width, height))
         dwg.add(dwg.rect(insert=(0, 0), size=(width, height), fill='white'))
+        # Use the detailed renderer only when the features carry a truthy
+        # 'detailed' entry; otherwise fall back to prompt-based content
+        if features.get('detailed', False):
+            self.add_detailed_elements(dwg, width, height, features)
         else:
+            self.add_content_based_on_prompt(dwg, prompt, width, height)
         return dwg.tostring()
     def apply_attention_reweighting(self, base_svg: str, prompt: str, attention_weights: dict, width: int, height: int):
         """Render a sketch whose elements reflect per-word attention weights.

         A fresh white canvas is created (``base_svg`` is not read here).  For
         each ``word -> weight`` entry an emphasized marker is drawn when the
         weight is above 1.0 and a de-emphasized marker when it is below 1.0;
         a weight of exactly 1.0 draws nothing.  The prompt-driven base content
         is added afterwards, so it is painted on top of the markers.

         Returns:
             The serialized drawing, as produced by ``Drawing.tostring()``.
         """
         canvas = svgwrite.Drawing(size=(width, height))
         canvas.add(canvas.rect(insert=(0, 0), size=(width, height), fill='white'))

         for token, strength in attention_weights.items():
             if strength > 1.0:
                 draw_marker = self.add_emphasized_element
             elif strength < 1.0:
                 draw_marker = self.add_deemphasized_element
             else:
                 # Neutral weight: leave this word without a marker.
                 continue
             draw_marker(canvas, token, strength, width, height)

         self.add_content_based_on_prompt(canvas, prompt, width, height)
         return canvas.tostring()
+    def add_person_elements(self, dwg, width, height, features):
+        """Add person-like elements"""
+        center_x, center_y = width // 2, height // 2
+        # Head
+        head_radius = 20
+        dwg.add(dwg.circle(center=(center_x, center_y - 40), r=head_radius, fill='#FDBCB4', stroke='black', stroke_width=2))
+        # Body
+        body_height = 60
+        body_width = 30
+        dwg.add(dwg.rect(
+            insert=(center_x - body_width//2, center_y - 10),
+            size=(body_width, body_height),
+            fill='#4A90E2',
+            stroke='black',
+            stroke_width=2
+        ))
+        # Arms
+        dwg.add(dwg.line(start=(center_x - body_width//2, center_y), end=(center_x - 40, center_y + 20), stroke='black', stroke_width=3))
+        dwg.add(dwg.line(start=(center_x + body_width//2, center_y), end=(center_x + 40, center_y + 20), stroke='black', stroke_width=3))
+        # Legs
+        dwg.add(dwg.line(start=(center_x - 10, center_y + body_height - 10), end=(center_x - 20, center_y + body_height + 30), stroke='black', stroke_width=3))
+        dwg.add(dwg.line(start=(center_x + 10, center_y + body_height - 10), end=(center_x + 20, center_y + body_height + 30), stroke='black', stroke_width=3))
+    def add_animal_elements(self, dwg, width, height, features):
+        """Add animal-like elements"""
+        center_x, center_y = width // 2, height // 2
+        # Body (oval)
+        dwg.add(dwg.ellipse(center=(center_x, center_y), r=(40, 25), fill='#8B4513', stroke='black', stroke_width=2))
+        # Head
+        dwg.add(dwg.circle(center=(center_x - 30, center_y - 10), r=20, fill='#A0522D', stroke='black', stroke_width=2))
+        # Legs
+        for i, x_offset in enumerate([-20, -10, 10, 20]):
+            dwg.add(dwg.line(
+                start=(center_x + x_offset, center_y + 25),
+                end=(center_x + x_offset, center_y + 45),
+                stroke='black',
+                stroke_width=3
+            ))
+        # Tail
+        dwg.add(dwg.path(
+            d=f"M {center_x + 40},{center_y} Q {center_x + 60},{center_y - 20} {center_x + 50},{center_y - 35}",
+            stroke='black',
+            stroke_width=3,
+            fill='none'
+        ))
+    def add_building_elements(self, dwg, width, height, features):
+        """Add building-like elements"""
+        # Main building
+        building_width = width * 0.6
+        building_height = height * 0.7
+        x = (width - building_width) // 2
+        y = height - building_height - 10
         dwg.add(dwg.rect(
+            insert=(x, y),
+            size=(building_width, building_height),
+            fill='#CD853F',
             stroke='black',
             stroke_width=2
         ))
         # Roof
+        roof_points = [(x, y), (x + building_width//2, y - 30), (x + building_width, y)]
+        dwg.add(dwg.polygon(points=roof_points, fill='#8B0000', stroke='black', stroke_width=2))
+        # Windows
+        window_size = 15
+        for i in range(3):
+            for j in range(4):
+                wx = x + 15 + i * 30
+                wy = y + 15 + j * 25
+                if wy < y + building_height - 20:
+                    dwg.add(dwg.rect(
+                        insert=(wx, wy),
+                        size=(window_size, window_size),
+                        fill='#87CEEB',
+                        stroke='black',
+                        stroke_width=1
+                    ))
         # Door
+        door_width = 20
+        door_height = 40
+        door_x = x + building_width//2 - door_width//2
+        door_y = y + building_height - door_height
         dwg.add(dwg.rect(
             insert=(door_x, door_y),
             size=(door_width, door_height),
+            fill='#8B4513',
             stroke='black',
             stroke_width=2
         ))
+    def add_nature_elements(self, dwg, width, height, features):
+        """Add nature-like elements"""
+        # Tree
+        center_x, center_y = width // 2, height // 2
         # Trunk
+        trunk_width = 15
+        trunk_height = height // 3
+        trunk_x = center_x - trunk_width // 2
+        trunk_y = height - trunk_height - 10
         dwg.add(dwg.rect(
+            insert=(trunk_x, trunk_y),
             size=(trunk_width, trunk_height),
+            fill='#8B4513',
             stroke='black',
+            stroke_width=1
         ))
+        # Crown (multiple circles for foliage)
+        crown_radius = 30
+        for i, (dx, dy) in enumerate([(-15, -20), (15, -20), (0, -35), (-10, -50), (10, -50)]):
+            dwg.add(dwg.circle(
+                center=(center_x + dx, center_y + dy),
+                r=crown_radius - i * 3,
+                fill='#228B22',
+                stroke='#006400',
+                stroke_width=1,
+                opacity=0.8
+            ))
+    def add_vehicle_elements(self, dwg, width, height, features):
+        """Add vehicle-like elements"""
+        center_x, center_y = width // 2, height // 2
         # Car body
+        car_width = width * 0.6
+        car_height = height * 0.3
+        car_x = (width - car_width) // 2
+        car_y = center_y + 10
         dwg.add(dwg.rect(
             insert=(car_x, car_y),
             size=(car_width, car_height),
+            fill='#FF4500',
             stroke='black',
             stroke_width=2,
             rx=5
         ))
+        # Windshield
+        windshield_width = car_width * 0.6
+        windshield_height = car_height * 0.4
+        windshield_x = car_x + (car_width - windshield_width) // 2
+        windshield_y = car_y - windshield_height + 5
+        dwg.add(dwg.rect(
+            insert=(windshield_x, windshield_y),
+            size=(windshield_width, windshield_height),
+            fill='#87CEEB',
             stroke='black',
+            stroke_width=1
         ))
+        # Wheels
+        wheel_radius = 12
+        wheel_y = car_y + car_height - 5
+        dwg.add(dwg.circle(center=(car_x + 25, wheel_y), r=wheel_radius, fill='black'))
+        dwg.add(dwg.circle(center=(car_x + car_width - 25, wheel_y), r=wheel_radius, fill='black'))
+    def add_abstract_elements(self, dwg, width, height, features):
+        """Add abstract elements"""
+        colors = ['#FF6B6B', '#4ECDC4', '#45B7D1', '#96CEB4', '#FFEAA7']
+        for i in range(5):
+            shape_type = random.choice(['circle', 'rect', 'path'])
+            color = random.choice(colors)
+            if shape_type == 'circle':
+                radius = random.randint(10, 30)
+                x = random.randint(radius, width - radius)
+                y = random.randint(radius, height - radius)
+                dwg.add(dwg.circle(center=(x, y), r=radius, fill=color, opacity=0.7))
+            elif shape_type == 'rect':
+                w = random.randint(20, 60)
+                h = random.randint(20, 60)
+                x = random.randint(0, width - w)
+                y = random.randint(0, height - h)
+                dwg.add(dwg.rect(insert=(x, y), size=(w, h), fill=color, opacity=0.7))
+            else:
+                # Random path
+                start_x = random.randint(0, width)
+                start_y = random.randint(0, height)
+                end_x = random.randint(0, width)
+                end_y = random.randint(0, height)
+                dwg.add(dwg.line(start=(start_x, start_y), end=(end_x, end_y), stroke=color, stroke_width=3))
+    def add_colored_elements(self, dwg, width, height, color_words):
+        """Add elements with specific colors"""
         color_map = {
             'red': '#FF0000',
             'blue': '#0000FF',
             'green': '#00FF00',
             'yellow': '#FFFF00',
+            'purple': '#800080',
+            'orange': '#FFA500'
         }
+        center_x, center_y = width // 2, height // 2
+        for word in color_words:
+            if word in color_map:
+                color = color_map[word]
+                # Add a colored shape
+                dwg.add(dwg.circle(
+                    center=(center_x + random.randint(-50, 50), center_y + random.randint(-50, 50)),
+                    r=random.randint(15, 35),
+                    fill=color,
+                    opacity=0.8
+                ))
+    def add_large_elements(self, dwg, width, height, features):
+        """Add large-sized elements"""
+        center_x, center_y = width // 2, height // 2
+        # Large central element
         dwg.add(dwg.circle(
+            center=(center_x, center_y),
+            r=min(width, height) // 3,
+            fill='#4A90E2',
             stroke='black',
+            stroke_width=3
         ))
+    def add_small_elements(self, dwg, width, height, features):
+        """Add small-sized elements"""
+        # Multiple small elements
+        for i in range(8):
+            x = random.randint(10, width - 10)
+            y = random.randint(10, height - 10)
+            dwg.add(dwg.circle(
+                center=(x, y),
+                r=random.randint(3, 8),
+                fill='#E74C3C',
+                opacity=0.7
             ))
+    def add_detailed_elements(self, dwg, width, height, features):
+        """Add detailed elements for refinement"""
+        # Add more complex shapes and details
+        self.add_abstract_elements(dwg, width, height, features)
+        # Add decorative elements
+        center_x, center_y = width // 2, height // 2
+        for i in range(4):
+            angle = i * math.pi / 2
+            x = center_x + 40 * math.cos(angle)
+            y = center_y + 40 * math.sin(angle)
+            dwg.add(dwg.circle(center=(x, y), r=8, fill='#9B59B6', opacity=0.6))
+    def add_emphasized_element(self, dwg, word: str, weight: float, width: int, height: int):
+        """Add emphasized element based on attention weight"""
+        center_x, center_y = width // 2, height // 2
+        # Scale size based on weight
+        base_size = 20
+        size = int(base_size * weight)
         dwg.add(dwg.circle(
+            center=(center_x + random.randint(-30, 30), center_y + random.randint(-30, 30)),
+            r=size,
+            fill='#FF6B6B',
+            opacity=min(1.0, weight / 2),
             stroke='black',
             stroke_width=2
         ))
+    def add_deemphasized_element(self, dwg, word: str, weight: float, width: int, height: int):
+        """Add de-emphasized element based on attention weight"""
+        center_x, center_y = width // 2, height // 2
+        # Scale size based on weight
+        base_size = 15
+        size = int(base_size * weight)
+        dwg.add(dwg.circle(
+            center=(center_x + random.randint(-40, 40), center_y + random.randint(-40, 40)),
+            r=max(3, size),
+            fill='#CCCCCC',
+            opacity=weight,
+            stroke='gray',
+            stroke_width=1
+        ))
+    def add_content_based_on_prompt(self, dwg, prompt: str, width: int, height: int):
+        """Add content based on prompt analysis"""
+        features = self.extract_semantic_features(prompt)
+        if any(word in prompt.lower() for word in ['person', 'people', 'human']):
+            self.add_person_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['animal', 'cat', 'dog']):
+            self.add_animal_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['house', 'building']):
+            self.add_building_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['tree', 'nature']):
+            self.add_nature_elements(dwg, width, height, features)
+        elif any(word in prompt.lower() for word in ['car', 'vehicle']):
+            self.add_vehicle_elements(dwg, width, height, features)
+        else:
+            self.add_abstract_elements(dwg, width, height, features)
+    def extract_semantic_features(self, prompt: str):
+        """Extract semantic features from prompt"""
+        features = {
+            'detailed': False,
+            'simple': False,
+            'colorful': False,
+            'large': False,
+            'small': False
         }
+        prompt_lower = prompt.lower()
+        if any(word in prompt_lower for word in ['detailed', 'complex', 'intricate']):
+            features['detailed'] = True
+        if any(word in prompt_lower for word in ['simple', 'minimal', 'basic']):
+            features['simple'] = True
+        if any(word in prompt_lower for word in ['colorful', 'bright', 'vibrant']):
+            features['colorful'] = True
+        if any(word in prompt_lower for word in ['large', 'big', 'huge']):
+            features['large'] = True
+        if any(word in prompt_lower for word in ['small', 'tiny', 'mini']):
+            features['small'] = True
+        return features
+    def svg_to_pil_image(self, svg_content: str, width: int, height: int):
         """Convert SVG content to PIL Image"""
         try:
             import cairosvg
             # Convert SVG to PNG bytes
             png_bytes = cairosvg.svg2png(
         # Simple centered text
         dwg.add(dwg.text(
+            f"DiffSketchEdit\n{prompt[:30]}...",
             insert=(width/2, height/2),
             text_anchor="middle",
+            font_size="12px",
             fill="black"
         ))