Linea / app.py
potato
remove diffusion model's default pbar, add callback function
8da5801
import os
import torch
import vtracer
import tempfile
import cairosvg
import re
from PIL import Image
from datetime import datetime
import gc
import json
import time
import queue
import threading
from flask import Flask, request, jsonify, send_from_directory, Response, stream_with_context
from flask_cors import CORS
from diffusers import StableDiffusionPipeline, LMSDiscreteScheduler
from diffusers.pipelines.stable_diffusion.pipeline_stable_diffusion import StableDiffusionPipelineOutput
import torchvision.transforms as transforms
from model import Generator
from utils import process_svg
os.environ["PYTORCH_CUDA_ALLOC_CONF"] = "expandable_segments:True"
def setup_directories():
os.makedirs(STROKES_DIR, exist_ok=True)
os.makedirs(THUMBNAIL_DIR, exist_ok=True)
print(f"Directories '{STROKES_DIR}' and '{THUMBNAIL_DIR}' are ready.")
def sanitize_filename(prompt):
"""Removes characters that are invalid for filenames."""
s = re.sub(r'[\\/*?:"<>|]', "", prompt)
return s[:100]
STROKES_DIR = os.path.join(os.getcwd(), 'strokes')
THUMBNAIL_DIR = os.path.join(os.getcwd(), 'thumbnails')
SKETCH_MODEL_WEIGHTS = os.path.join('checkpoints', 'netG_A_latest.pth')
class ImageToSvgPipeline:
def __init__(self, sketch_model_path: str):
self.device = "cuda" if torch.cuda.is_available() else "cpu"
print(f"Using device: {self.device}")
self._initialize_rinna_model()
self._initialize_sketch_model(sketch_model_path)
def _initialize_rinna_model(self):
print("Loading Rinna Stable Diffusion model...")
model_id = "rinna/japanese-stable-diffusion"
self.rinna_pipe = StableDiffusionPipeline.from_pretrained(
model_id,
torch_dtype=torch.float16 if self.device == "cuda" else torch.float32,
)
self.rinna_pipe.scheduler = LMSDiscreteScheduler(
beta_start=0.00085, beta_end=0.012,
beta_schedule="scaled_linear", num_train_timesteps=1000
)
self.rinna_pipe.tokenizer.model_max_length = 77
self.rinna_pipe.to(self.device)
self.rinna_pipe.set_progress_bar_config(disable=True)
print("Rinna model loaded.")
def unload_rinna_model(self):
if hasattr(self, 'rinna_pipe'):
print("Unloading Rinna Stable Diffusion model...")
del self.rinna_pipe
gc.collect()
if self.device == "cuda":
torch.cuda.empty_cache()
print("GPU memory cache cleared.")
print("Rinna model unloaded successfully.")
else:
print("Rinna model is not currently loaded.")
def _initialize_sketch_model(self, model_path: str):
print(f"Loading Sketch Generator model from {model_path}...")
if not os.path.exists(model_path):
raise FileNotFoundError(f"Sketch model weights not found at: {model_path}")
self.sketch_model = Generator(input_nc=3, output_nc=1, n_residual_blocks=3)
self.sketch_model.to(self.device)
self.sketch_model.load_state_dict(torch.load(model_path, map_location=self.device))
self.sketch_model.eval()
self.sketch_transform = transforms.Compose([
transforms.ToTensor(),
])
print("Sketch model loaded.")
def _generate_image(self, prompt: str, negative_prompt: str, steps: int = 30, callback=None) -> Image.Image:
print(f"Generating image for prompt: '{prompt}'")
with torch.no_grad():
output: StableDiffusionPipelineOutput = self.rinna_pipe(
prompt,
negative_prompt=negative_prompt,
num_inference_steps=steps,
guidance_scale=7.5,
width=720,
height=720,
callback_on_step_end=callback
)
return output.images[0]
def _convert_to_sketch(self, image: Image.Image) -> Image.Image:
print("Converting image to sketch...")
with torch.no_grad():
input_tensor = self.sketch_transform(image.convert("RGB")).unsqueeze(0).to(self.device)
output_tensor = self.sketch_model(input_tensor)
output_tensor = output_tensor.squeeze(0).cpu()
sketch_image = transforms.ToPILImage()(output_tensor)
return sketch_image
def _extract_svg(self, image: Image.Image) -> str:
print("Extracting SVG from sketch...")
with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp_file:
image.save(tmp_file.name)
tmp_path = tmp_file.name
try:
svg_output_path = tmp_path.replace(".png", ".svg")
vtracer.convert_image_to_svg_py(tmp_path, svg_output_path)
with open(svg_output_path, 'r', encoding='utf-8') as f:
svg_data = f.read()
finally:
if os.path.exists(tmp_path): os.remove(tmp_path)
if 'svg_output_path' in locals() and os.path.exists(svg_output_path): os.remove(svg_output_path)
print("SVG extraction complete.")
return svg_data
def process(self, prompt: str, img_path: str, negative_prompt: str, callback=None):
"""Processes the image generation and conversion, with progress callbacks."""
def _callback(progress, step_name):
if callback:
callback(progress, step_name)
generated_img = None
if img_path is None:
total_diffusion_steps = 30
def diffusion_callback(pipe, step_index, timestep, callback_kwargs):
progress = int(5 + ((step_index + 1) / total_diffusion_steps) * 75)
_callback(progress, "Generating image...")
return callback_kwargs
_callback(5, "Starting image generation...")
generated_img = self._generate_image(
prompt,
negative_prompt,
steps=total_diffusion_steps,
callback=diffusion_callback
)
gc.collect()
torch.cuda.empty_cache()
_callback(80, "Base image generated.")
img_to_process = generated_img
else:
generated_img = Image.open(img_path)
img_to_process = generated_img
_callback(80, "Image loaded.")
_callback(85, "Converting to sketch...")
sketch_image = self._convert_to_sketch(img_to_process)
_callback(90, "Vectorizing sketch...")
svg_content = self._extract_svg(sketch_image)
_callback(95, "SVG extracted.")
return svg_content, generated_img
app = Flask(__name__)
CORS(app, resources={r"/*": {"origins": "*"}})
pipeline = ImageToSvgPipeline(sketch_model_path=SKETCH_MODEL_WEIGHTS)
@app.after_request
def add_ngrok_header(response):
response.headers['ngrok-skip-browser-warning'] = 'true'
return response
@app.route('/generate', methods=['GET'])
def generate_stroke():
prompt = request.args.get('prompt')
if not prompt:
return jsonify({"error": "Prompt is required"}), 400
negative_prompt = (
"低品質、最悪の品質、奇形、醜い、ぼやけている、ぼやけた、"
"ウォーターマーク、署名、テキスト、フレームから外れた、"
"手足が切れている、クロップされた、被写体が切り取られている、"
"構成が悪い、焦点が合っていない"
)
q = queue.Queue()
def worker():
"""Runs the long-running task in a separate thread and puts progress into the queue."""
start_time = time.time()
def progress_callback(progress, step):
print(f"Progress: {progress}% - {step}")
data = json.dumps({"progress": progress, "step": step})
q.put(data)
try:
progress_callback(5, "Initializing...")
svg_result, generated_image = pipeline.process(prompt, None, negative_prompt, callback=progress_callback)
progress_callback(98, "Finalizing and saving...")
timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
safe_prompt = sanitize_filename(prompt)[:60]
filename_base = f"{timestamp}_{safe_prompt}"
stroke_path = os.path.join(STROKES_DIR, f"{filename_base}.json")
stroke = process_svg(svg_result, "file")
with open(stroke_path, 'w', encoding='utf-8') as f:
json.dump(stroke, f, ensure_ascii=False, indent=2)
if generated_image:
thumbnail_path = os.path.join(THUMBNAIL_DIR, f"{filename_base}.png")
cairosvg.svg2png(bytestring=svg_result.encode('utf-8'), write_to=thumbnail_path, output_width=256, output_height=256)
final_data = json.dumps({"progress": 100, "result": stroke, "step": "Complete!"})
q.put(final_data)
end_time = time.time()
print(f"Total generation time: {end_time - start_time:.2f} seconds")
except Exception as e:
print(f"Error during generation stream: {e}")
error_data = json.dumps({"error": str(e), "progress": 100})
q.put(error_data)
finally:
q.put(None)
threading.Thread(target=worker).start()
def generate():
"""This generator reads from the queue and yields data to the client."""
while True:
item = q.get()
if item is None:
break
yield f"data: {item}\n\n"
return Response(stream_with_context(generate()), mimetype='text/event-stream')
@app.route('/gallery', methods=['GET'])
def get_gallery():
try:
page = int(request.args.get('page', 1))
limit = int(request.args.get('limit', 8))
strokes_files = sorted([f for f in os.listdir(STROKES_DIR) if f.endswith('.json')], reverse=True)
start_index = (page - 1) * limit
end_index = start_index + limit
paginated_files = strokes_files[start_index:end_index]
drawings = []
for filename in paginated_files:
prompt_match = re.match(r"\d+_(.+)\.json", filename)
prompt = prompt_match.group(1).replace('_', ' ') if prompt_match else "Prompt not found"
drawings.append({
"filename": filename,
"thumbnail": f"/thumbnails/{filename.replace('.json', '.png')}",
"prompt": prompt
})
has_more = end_index < len(strokes_files)
return jsonify({"drawings": drawings, "hasMore": has_more})
except Exception as e:
print(f"Error fetching gallery: {e}")
return jsonify({"error": "Failed to fetch gallery"}), 500
@app.route('/add_svg', methods=['POST'])
def add_svg():
data = request.json
folder_path = data.get('folderPath').strip()
count = 0
for file in os.listdir(folder_path):
file_path = os.path.join(folder_path, file)
stroke_path = os.path.join(STROKES_DIR, file.replace('.svg', '.json'))
stroke = process_svg(file_path, "path")
with open(stroke_path, 'w', encoding='utf-8') as f:
json.dump(stroke, f, ensure_ascii=False, indent=2)
thumbnail_path = os.path.join(THUMBNAIL_DIR, file.replace('.svg', '.png'))
cairosvg.svg2png(url=file_path, write_to=thumbnail_path, output_width=256, output_height=256)
count += 1
return jsonify({"status": "success", "message": f"Processed {count} SVG files."})
@app.route('/add_img', methods=['POST'])
def add_img():
data = request.json
folder_path = data.get('folderPath').strip()
count = 0
pipeline.unload_rinna_model()
for file in os.listdir(folder_path):
file_path = os.path.join(folder_path, file)
svg_result, _ = pipeline.process(None, file_path, None)
timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
filename = f"{timestamp}_{file.replace('.jpg', '.json').replace('.png', '.json')}"
stroke_path = os.path.join(STROKES_DIR, filename)
stroke = process_svg(svg_result, "file")
with open(stroke_path, 'w', encoding='utf-8') as f:
json.dump(stroke, f, ensure_ascii=False, indent=2)
thumbnail_path = os.path.join(THUMBNAIL_DIR, filename.replace('.json', '.png'))
cairosvg.svg2png(bytestring=svg_result.encode('utf-8'), write_to=thumbnail_path, output_width=256, output_height=256)
count += 1
pipeline._initialize_rinna_model()
return jsonify({"status": "success", "message": f"Processed {count} image files."})
@app.route('/strokes/<path:filename>')
def get_strokes(filename):
return send_from_directory(STROKES_DIR, filename)
@app.route('/thumbnails/<path:filename>')
def get_thumbnail(filename):
return send_from_directory(THUMBNAIL_DIR, filename)
@app.route('/drawings/<path:filename>', methods=['DELETE'])
def delete_drawing_file(filename):
try:
json_path = os.path.join(STROKES_DIR, filename)
thumb_path = os.path.join(THUMBNAIL_DIR, filename.replace('.json', '.png'))
if os.path.exists(json_path): os.remove(json_path)
if os.path.exists(thumb_path): os.remove(thumb_path)
return jsonify({"message": f"Successfully deleted {filename}"})
except Exception as e:
print(f"Error deleting file: {e}")
return jsonify({"error": "Failed to delete file"}), 500
app.mount("/strokes", StaticFiles(directory=STROKES_DIR), name="strokes")
app.mount("/thumbnails", StaticFiles(directory=THUMBNAIL_DIR), name="thumbnails")
if __name__ == '__main__':
print("Starting FastAPI server...")
uvicorn.run(app, host='0.0.0.0', port=7860)