Spaces:

grilledPotato
/

Linea

Runtime error

File size: 13,733 Bytes

import os
import torch
import vtracer
import tempfile
import cairosvg
import re
from PIL import Image
from datetime import datetime
import gc
import json 
import time
import queue
import threading

from flask import Flask, request, jsonify, send_from_directory, Response, stream_with_context
from flask_cors import CORS

from diffusers import StableDiffusionPipeline, LMSDiscreteScheduler
from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion import StableDiffusionPipelineOutput

import torchvision.transforms as transforms
from model import Generator 
from utils import process_svg

os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True" 

def setup_directories():
    os.makedirs(STROKES_DIR, exist_ok=True)
    os.makedirs(THUMBNAIL_DIR, exist_ok=True)
    print(f"Directories '{STROKES_DIR}' and '{THUMBNAIL_DIR}' are ready.")

def sanitize_filename(prompt):
    """Removes characters that are invalid for filenames."""
    s = re.sub(r'[\\/*?:"<>|]', "", prompt)
    return s[:100]

STROKES_DIR = os.path.join(os.getcwd(), 'strokes')
THUMBNAIL_DIR = os.path.join(os.getcwd(), 'thumbnails')
SKETCH_MODEL_WEIGHTS = os.path.join('checkpoints', 'netG_A_latest.pth')

class ImageToSvgPipeline:
    def __init__(self, sketch_model_path: str):
        self.device = "cuda" if torch.cuda.is_available() else "cpu"
        print(f"Using device: {self.device}")

        self._initialize_rinna_model()
        self._initialize_sketch_model(sketch_model_path)

    def _initialize_rinna_model(self):
        print("Loading Rinna Stable Diffusion model...")
        model_id = "rinna/japanese-stable-diffusion"

        self.rinna_pipe = StableDiffusionPipeline.from_pretrained(
            model_id,
            torch_dtype=torch.float16 if self.device == "cuda" else torch.float32,
        )
        self.rinna_pipe.scheduler = LMSDiscreteScheduler(
            beta_start=0.00085, beta_end=0.012, 
            beta_schedule="scaled_linear", num_train_timesteps=1000
        )
        self.rinna_pipe.tokenizer.model_max_length = 77
        self.rinna_pipe.to(self.device)
        self.rinna_pipe.set_progress_bar_config(disable=True)
        print("Rinna model loaded.")

    def unload_rinna_model(self):
        if hasattr(self, 'rinna_pipe'):
            print("Unloading Rinna Stable Diffusion model...")
            del self.rinna_pipe
            gc.collect()
            if self.device == "cuda":
                torch.cuda.empty_cache()
                print("GPU memory cache cleared.")
            print("Rinna model unloaded successfully.")
        else:
            print("Rinna model is not currently loaded.")

    def _initialize_sketch_model(self, model_path: str):
        print(f"Loading Sketch Generator model from {model_path}...")
        if not os.path.exists(model_path):
            raise FileNotFoundError(f"Sketch model weights not found at: {model_path}")

        self.sketch_model = Generator(input_nc=3, output_nc=1, n_residual_blocks=3)
        self.sketch_model.to(self.device)
        self.sketch_model.load_state_dict(torch.load(model_path, map_location=self.device))
        self.sketch_model.eval()

        self.sketch_transform = transforms.Compose([
            transforms.ToTensor(),
        ])
        print("Sketch model loaded.")

    def _generate_image(self, prompt: str, negative_prompt: str, steps: int = 30, callback=None) -> Image.Image:
        print(f"Generating image for prompt: '{prompt}'")
        with torch.no_grad():
            output: StableDiffusionPipelineOutput = self.rinna_pipe(
                prompt,
                negative_prompt=negative_prompt,
                num_inference_steps=steps,
                guidance_scale=7.5,
                width=720,
                height=720,
                callback_on_step_end=callback
            )
        return output.images[0]

    def _convert_to_sketch(self, image: Image.Image) -> Image.Image:
        print("Converting image to sketch...")
        with torch.no_grad():
            input_tensor = self.sketch_transform(image.convert("RGB")).unsqueeze(0).to(self.device)
            output_tensor = self.sketch_model(input_tensor)
            output_tensor = output_tensor.squeeze(0).cpu()
            sketch_image = transforms.ToPILImage()(output_tensor)
        return sketch_image

    def _extract_svg(self, image: Image.Image) -> str:
        print("Extracting SVG from sketch...")
        with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_file:
            image.save(tmp_file.name)
            tmp_path = tmp_file.name

        try:
            svg_output_path = tmp_path.replace(".png", ".svg")
            vtracer.convert_image_to_svg_py(tmp_path, svg_output_path)
            with open(svg_output_path, 'r', encoding='utf-8') as f:
                svg_data = f.read()
        finally:
            if os.path.exists(tmp_path): os.remove(tmp_path)
            if 'svg_output_path' in locals() and os.path.exists(svg_output_path): os.remove(svg_output_path)

        print("SVG extraction complete.")
        return svg_data

    def process(self, prompt: str, img_path: str, negative_prompt: str, callback=None):
        """Processes the image generation and conversion, with progress callbacks."""
        def _callback(progress, step_name):
            if callback:
                callback(progress, step_name)
        
        generated_img = None
        if img_path is None:
            total_diffusion_steps = 30
            
            def diffusion_callback(pipe, step_index, timestep, callback_kwargs):
                progress = int(5 + ((step_index + 1) / total_diffusion_steps) * 75)
                _callback(progress, "Generating image...")
                return callback_kwargs

            _callback(5, "Starting image generation...")
            generated_img = self._generate_image(
                prompt, 
                negative_prompt, 
                steps=total_diffusion_steps, 
                callback=diffusion_callback
            )
            gc.collect()
            torch.cuda.empty_cache()
            _callback(80, "Base image generated.")
            img_to_process = generated_img
        else:
            generated_img = Image.open(img_path)
            img_to_process = generated_img
            _callback(80, "Image loaded.")

        _callback(85, "Converting to sketch...")
        sketch_image = self._convert_to_sketch(img_to_process)
        
        _callback(90, "Vectorizing sketch...")
        svg_content = self._extract_svg(sketch_image)
        _callback(95, "SVG extracted.")

        return svg_content, generated_img


app = Flask(__name__)
CORS(app, resources={r"/*": {"origins": "*"}})
pipeline = ImageToSvgPipeline(sketch_model_path=SKETCH_MODEL_WEIGHTS)

@app.after_request
def add_ngrok_header(response):
    response.headers['ngrok-skip-browser-warning'] = 'true'
    return response

@app.route('/generate', methods=['GET'])
def generate_stroke():
    prompt = request.args.get('prompt')
    if not prompt:
        return jsonify({"error": "Prompt is required"}), 400

    negative_prompt = (
        "低品質、最悪の品質、奇形、醜い、ぼやけている、ぼやけた、"
        "ウォーターマーク、署名、テキスト、フレームから外れた、"
        "手足が切れている、クロップされた、被写体が切り取られている、"
        "構成が悪い、焦点が合っていない"
    )

    q = queue.Queue()

    def worker():
        """Runs the long-running task in a separate thread and puts progress into the queue."""
        start_time = time.time()
        
        def progress_callback(progress, step):
            print(f"Progress: {progress}% - {step}")
            data = json.dumps({"progress": progress, "step": step})
            q.put(data)

        try:
            progress_callback(5, "Initializing...")
            
            svg_result, generated_image = pipeline.process(prompt, None, negative_prompt, callback=progress_callback)
            
            progress_callback(98, "Finalizing and saving...")
            
            timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
            safe_prompt = sanitize_filename(prompt)[:60]
            filename_base = f"{timestamp}_{safe_prompt}"
            
            stroke_path = os.path.join(STROKES_DIR, f"{filename_base}.json")
            stroke = process_svg(svg_result, "file")
            with open(stroke_path, 'w', encoding='utf-8') as f:
                json.dump(stroke, f, ensure_ascii=False, indent=2)

            if generated_image:
                thumbnail_path = os.path.join(THUMBNAIL_DIR, f"{filename_base}.png")
                cairosvg.svg2png(bytestring=svg_result.encode('utf-8'), write_to=thumbnail_path, output_width=256, output_height=256)

            final_data = json.dumps({"progress": 100, "result": stroke, "step": "Complete!"})
            q.put(final_data)
            end_time = time.time()
            print(f"Total generation time: {end_time - start_time:.2f} seconds")

        except Exception as e:
            print(f"Error during generation stream: {e}")
            error_data = json.dumps({"error": str(e), "progress": 100})
            q.put(error_data)
        finally:
            q.put(None)

    threading.Thread(target=worker).start()

    def generate():
        """This generator reads from the queue and yields data to the client."""
        while True:
            item = q.get()
            if item is None:
                break
            yield f"data: {item}\n\n"

    return Response(stream_with_context(generate()), mimetype='text/event-stream')


@app.route('/gallery', methods=['GET'])
def get_gallery():
    try:
        page = int(request.args.get('page', 1))
        limit = int(request.args.get('limit', 8))

        strokes_files = sorted([f for f in os.listdir(STROKES_DIR) if f.endswith('.json')], reverse=True)
        start_index = (page - 1) * limit
        end_index = start_index + limit
        paginated_files = strokes_files[start_index:end_index]

        drawings = []
        for filename in paginated_files:
            prompt_match = re.match(r"\d+_(.+)\.json", filename)
            prompt = prompt_match.group(1).replace('_', ' ') if prompt_match else "Prompt not found"
            drawings.append({
                "filename": filename,
                "thumbnail": f"/thumbnails/{filename.replace('.json', '.png')}",
                "prompt": prompt
            })

        has_more = end_index < len(strokes_files)
        return jsonify({"drawings": drawings, "hasMore": has_more})
    except Exception as e:
        print(f"Error fetching gallery: {e}")
        return jsonify({"error": "Failed to fetch gallery"}), 500

@app.route('/add_svg', methods=['POST'])
def add_svg():
    data = request.json
    folder_path = data.get('folderPath').strip()
    count = 0
    for file in os.listdir(folder_path):
        file_path = os.path.join(folder_path, file)
        stroke_path = os.path.join(STROKES_DIR, file.replace('.svg', '.json'))
        stroke = process_svg(file_path, "path")
        with open(stroke_path, 'w', encoding='utf-8') as f:
            json.dump(stroke, f, ensure_ascii=False, indent=2)
        thumbnail_path = os.path.join(THUMBNAIL_DIR, file.replace('.svg', '.png'))
        cairosvg.svg2png(url=file_path, write_to=thumbnail_path, output_width=256, output_height=256)
        count += 1
    return jsonify({"status": "success", "message": f"Processed {count} SVG files."})

@app.route('/add_img', methods=['POST'])
def add_img():
    data = request.json
    folder_path = data.get('folderPath').strip()
    count = 0
    pipeline.unload_rinna_model()
    for file in os.listdir(folder_path):
        file_path = os.path.join(folder_path, file)
        svg_result, _ = pipeline.process(None, file_path, None)
        timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
        filename = f"{timestamp}_{file.replace('.jpg', '.json').replace('.png', '.json')}"
        stroke_path = os.path.join(STROKES_DIR, filename)
        stroke = process_svg(svg_result, "file")
        with open(stroke_path, 'w', encoding='utf-8') as f:
            json.dump(stroke, f, ensure_ascii=False, indent=2)
        thumbnail_path = os.path.join(THUMBNAIL_DIR, filename.replace('.json', '.png'))
        cairosvg.svg2png(bytestring=svg_result.encode('utf-8'), write_to=thumbnail_path, output_width=256, output_height=256)
        count += 1
    pipeline._initialize_rinna_model()
    return jsonify({"status": "success", "message": f"Processed {count} image files."})

@app.route('/strokes/<path:filename>')
def get_strokes(filename):
    return send_from_directory(STROKES_DIR, filename)

@app.route('/thumbnails/<path:filename>')
def get_thumbnail(filename):
    return send_from_directory(THUMBNAIL_DIR, filename)

@app.route('/drawings/<path:filename>', methods=['DELETE'])
def delete_drawing_file(filename):
    try:
        json_path = os.path.join(STROKES_DIR, filename)
        thumb_path = os.path.join(THUMBNAIL_DIR, filename.replace('.json', '.png'))
        if os.path.exists(json_path): os.remove(json_path)
        if os.path.exists(thumb_path): os.remove(thumb_path)
        return jsonify({"message": f"Successfully deleted {filename}"})
    except Exception as e:
        print(f"Error deleting file: {e}")
        return jsonify({"error": "Failed to delete file"}), 500

app.mount("/strokes", StaticFiles(directory=STROKES_DIR), name="strokes")
app.mount("/thumbnails", StaticFiles(directory=THUMBNAIL_DIR), name="thumbnails")


if __name__ == '__main__':
    print("Starting FastAPI server...")
    uvicorn.run(app, host='0.0.0.0', port=7860)