File size: 13,437 Bytes
6e28688
cfec117
 
 
6e28688
 
 
 
 
cfec117
 
6e28688
 
 
 
fc4ba89
 
 
 
 
 
6e28688
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
727a4d5
6e28688
 
cfec117
6e28688
 
cfec117
6e28688
 
cfec117
6e28688
 
 
 
 
cfec117
 
6e28688
cfec117
 
fc4ba89
 
 
 
 
 
 
 
 
 
eb47665
08247fe
fc4ba89
 
08247fe
fc4ba89
 
eb47665
 
08247fe
fc4ba89
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
270f50f
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6e28688
 
 
270f50f
cfec117
6e28688
fd380f8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7e23f03
 
 
 
 
 
 
 
 
 
 
 
6e28688
 
 
 
727a4d5
 
 
 
 
 
fc4ba89
6e28688
 
270f50f
 
 
 
 
 
fc4ba89
 
 
270f50f
6e28688
 
270f50f
6e28688
 
 
 
fd380f8
 
 
 
 
6e28688
270f50f
6e28688
270f50f
 
 
6e28688
7e23f03
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
"""Notebook-style diffusers loader for BiliSakura Hub models."""

from __future__ import annotations

import gc
import inspect
import os
from pathlib import Path
from typing import Any, get_args, get_origin

import torch
from diffusers import DiffusionPipeline
import diffusers.pipelines.pipeline_utils as pipeline_utils
from huggingface_hub import snapshot_download

from model_catalog import (
    ModelProfile,
    get_profile,
    scheduler_choices_for_profile,
    uses_native_scheduler,
)


def _patch_diffusers_custom_pipeline_type_check() -> None:
    """Work around diffusers 0.36 KeyError when custom pipelines omit parsed annotations."""

    if getattr(pipeline_utils, "_bilisakura_type_check_patch", False):
        return

    @classmethod
    def patched_get_signature_types(cls):
        signature_types = {}
        for name, param in inspect.signature(cls.__init__).parameters.items():
            if name == "self":
                continue
            annotation = param.annotation
            if annotation is inspect.Parameter.empty:
                signature_types[name] = (inspect.Signature.empty,)
                continue
            origin = get_origin(annotation)
            if inspect.isclass(annotation):
                signature_types[name] = (annotation,)
            elif origin is not None:
                args = get_args(annotation)
                signature_types[name] = args if args else (annotation,)
            else:
                signature_types[name] = (inspect.Signature.empty,)
        return signature_types

    original_from_pretrained = DiffusionPipeline.from_pretrained.__func__

    @classmethod
    def from_pretrained_patched(cls, pretrained_model_name_or_path, *args, **kwargs):
        original_get_signature_types = DiffusionPipeline._get_signature_types
        DiffusionPipeline._get_signature_types = patched_get_signature_types
        try:
            return original_from_pretrained(cls, pretrained_model_name_or_path, *args, **kwargs)
        finally:
            DiffusionPipeline._get_signature_types = original_get_signature_types

    DiffusionPipeline.from_pretrained = from_pretrained_patched
    pipeline_utils._bilisakura_type_check_patch = True


_patch_diffusers_custom_pipeline_type_check()


LOCAL_MODELS_ROOT = Path(os.environ.get("LOCAL_MODELS_ROOT", "")).expanduser()
USE_LOCAL_MODELS = LOCAL_MODELS_ROOT.is_dir()
HF_ORG = os.environ.get("HF_MODEL_ORG", "BiliSakura")

class PipelineManager:
    def __init__(self) -> None:
        self._pipe: DiffusionPipeline | None = None
        self._loaded_label: str | None = None
        self._loaded_profile: ModelProfile | None = None
        self._on_cuda: bool = False

    @property
    def loaded_label(self) -> str | None:
        return self._loaded_label

    @property
    def loaded_profile(self) -> ModelProfile | None:
        return self._loaded_profile

    @property
    def pipe(self) -> DiffusionPipeline | None:
        return self._pipe

    def _resolve_model_source(self, profile: ModelProfile) -> tuple[str, str]:
        """Return local checkpoint path and a human-readable source label."""
        if USE_LOCAL_MODELS:
            local_path = LOCAL_MODELS_ROOT / profile.collection / profile.variant
            if local_path.is_dir():
                return str(local_path.resolve()), str(local_path)

        repo_id = profile.hub_repo
        cached_repo = snapshot_download(
            repo_id,
            repo_type="model",
            allow_patterns=[f"{profile.variant}/**"],
        )
        model_dir = Path(cached_repo) / profile.variant
        return str(model_dir.resolve()), f"{repo_id} (subfolder `{profile.variant}`)"

    def _resolve_dtype(self, profile: ModelProfile) -> torch.dtype:
        return torch.bfloat16 if profile.dtype == "bfloat16" else torch.float32

    def _apply_post_load(self, pipe: DiffusionPipeline) -> None:
        pipe.set_progress_bar_config(disable=True)

    def unload(self) -> None:
        if self._pipe is not None:
            del self._pipe
            self._pipe = None
        self._loaded_label = None
        self._loaded_profile = None
        self._on_cuda = False
        gc.collect()

    def move_to_cuda(self) -> None:
        if self._pipe is None or self._on_cuda:
            return
        self._pipe = self._pipe.to("cuda")
        self._on_cuda = True

    def load(self, collection: str, variant: str) -> tuple[str, ModelProfile]:
        profile = get_profile(collection, variant)
        label = profile.label
        if self._loaded_label == label and self._pipe is not None:
            return f"Model already loaded: `{label}`", profile

        self.unload()
        model_source, source_label = self._resolve_model_source(profile)
        dtype = self._resolve_dtype(profile)
        model_path = Path(model_source)

        load_kwargs: dict[str, Any] = {
            "trust_remote_code": True,
            "torch_dtype": dtype,
        }
        if profile.use_custom_pipeline:
            load_kwargs["custom_pipeline"] = str(model_path / "pipeline.py")

        if USE_LOCAL_MODELS and (LOCAL_MODELS_ROOT / profile.collection / profile.variant).is_dir():
            load_kwargs["local_files_only"] = True

        pipe = DiffusionPipeline.from_pretrained(model_source, **load_kwargs)
        self._apply_post_load(pipe)

        self._pipe = pipe
        self._loaded_label = label
        self._loaded_profile = profile
        self._on_cuda = False
        return f"Loaded `{label}` from `{source_label}`.", profile


PIPELINE_MANAGER = PipelineManager()


def current_scheduler_name(pipe: DiffusionPipeline) -> str:
    return type(pipe.scheduler).__name__


def scheduler_options_for_profile(profile: ModelProfile, pipe: DiffusionPipeline | None = None) -> tuple[list[str], str]:
    if uses_native_scheduler(profile):
        if pipe is not None:
            name = current_scheduler_name(pipe)
            return [name], name
        return ["checkpoint"], "checkpoint"

    swappable = scheduler_choices_for_profile(profile)
    if pipe is not None:
        loaded = current_scheduler_name(pipe)
        choices = list(swappable)
        if loaded not in choices:
            choices = [loaded, *choices]
        return choices, loaded

    return ["checkpoint", *swappable], "checkpoint"


def swap_scheduler(pipe: DiffusionPipeline, scheduler_name: str, profile: ModelProfile) -> None:
    if scheduler_name in {"", "checkpoint"}:
        return
    current = current_scheduler_name(pipe)
    if scheduler_name == current:
        return

    import diffusers

    if not hasattr(diffusers, scheduler_name):
        raise ValueError(f"Unknown diffusers scheduler: {scheduler_name}")

    scheduler_cls = getattr(diffusers, scheduler_name)
    extra_kwargs = profile.scheduler_kwargs if profile.scheduler == scheduler_name else {}
    pipe.scheduler = scheduler_cls.from_config(pipe.scheduler.config, **extra_kwargs)


def _to_int(value: Any, *, default: int = 0) -> int:
    if value is None:
        return default
    if isinstance(value, bool):
        return int(value)
    if isinstance(value, (int, float)):
        return int(value)
    text = str(value).strip()
    if not text:
        return default
    return int(float(text))


def _to_float(value: Any, *, default: float = 0.0) -> float:
    if value is None:
        return default
    if isinstance(value, (int, float)):
        return float(value)
    text = str(value).strip()
    if not text:
        return default
    return float(text)


def build_inference_steps(profile: ModelProfile, steps: Any) -> int | list[int]:
    steps = _to_int(steps, default=profile.default_steps)
    if profile.steps_are_list:
        per_stage = max(1, steps // 4)
        return [per_stage, per_stage, per_stage, per_stage]
    return steps


def _split_synonyms(label_text: str) -> list[str]:
    return [part.strip() for part in label_text.split(",") if part.strip()]


def _get_pipe_id2label(pipe: DiffusionPipeline) -> dict[int, str]:
    id2label: dict[int, str] | None = None
    if hasattr(pipe, "id2label"):
        raw = pipe.id2label
        if isinstance(raw, dict) and raw:
            id2label = {int(key): str(value) for key, value in raw.items()}
    if id2label is None:
        config = getattr(pipe, "config", None)
        raw = getattr(config, "id2label", None) if config is not None else None
        if isinstance(raw, dict) and raw:
            id2label = {int(key): str(value) for key, value in raw.items()}
    return id2label or {}


def _build_label2id(id2label: dict[int, str]) -> dict[str, int]:
    label2id: dict[str, int] = {}
    for class_id, value in id2label.items():
        synonyms = _split_synonyms(value)
        if not synonyms:
            continue
        for synonym in synonyms:
            label2id[synonym] = int(class_id)
        label2id[value.strip()] = int(class_id)
    return label2id


def resolve_class_labels(
    pipe: DiffusionPipeline,
    class_label: str,
    *,
    default: str,
) -> int | str:
    """Resolve a class name or id using the loaded model's id2label synonyms."""
    label = str(class_label or "").strip() or default
    if label.isdigit():
        return int(label)
    if label.replace(".", "", 1).isdigit():
        return int(float(label))

    id2label = _get_pipe_id2label(pipe)
    if not id2label:
        return label

    label2id = _build_label2id(id2label)
    if label in label2id:
        return label2id[label]

    for part in _split_synonyms(label):
        if part in label2id:
            return label2id[part]

    normalized = label.casefold()
    for class_id, value in id2label.items():
        if value.strip().casefold() == normalized:
            return int(class_id)
        for part in _split_synonyms(value):
            if part.casefold() == normalized:
                return int(class_id)

    if hasattr(pipe, "get_label_ids"):
        for candidate in _split_synonyms(label):
            try:
                return pipe.get_label_ids(candidate)[0]
            except (ValueError, TypeError):
                continue

    return label


def primary_label_for_id(pipe: DiffusionPipeline, class_id: int, *, fallback: str) -> str:
    """Return the first synonym from id2label for a class id."""
    id2label = _get_pipe_id2label(pipe)
    value = id2label.get(int(class_id))
    if not value:
        return fallback
    synonyms = _split_synonyms(value)
    return synonyms[0] if synonyms else fallback


def default_class_label_for_pipe(pipe: DiffusionPipeline, profile: ModelProfile) -> str:
    """Pick a sensible default label using id2label synonyms when available."""
    id2label = _get_pipe_id2label(pipe)
    if not id2label:
        return profile.default_class_label

    preferred_ids = (207, 285, 281)
    for class_id in preferred_ids:
        if class_id in id2label:
            return primary_label_for_id(pipe, class_id, fallback=profile.default_class_label)

    for value in id2label.values():
        for synonym in _split_synonyms(value):
            if synonym.casefold() == profile.default_class_label.casefold():
                return synonym

    first_value = next(iter(id2label.values()), profile.default_class_label)
    synonyms = _split_synonyms(first_value)
    return synonyms[0] if synonyms else profile.default_class_label


def _filter_call_kwargs(pipe: DiffusionPipeline, call_kwargs: dict[str, Any]) -> dict[str, Any]:
    """Drop kwargs that the pipeline __call__ does not accept (e.g. height/width for iMF/pMF)."""
    try:
        params = inspect.signature(pipe.__call__).parameters
    except (TypeError, ValueError):
        return call_kwargs
    if any(param.kind == inspect.Parameter.VAR_KEYWORD for param in params.values()):
        return call_kwargs
    accepted = set(params.keys())
    return {key: value for key, value in call_kwargs.items() if key in accepted}


def run_inference(
    profile: ModelProfile,
    pipe: DiffusionPipeline,
    *,
    class_label: str,
    seed: int,
    num_steps: int,
    guidance_scale: float,
    height: int,
    width: int,
    scheduler_name: str | None = None,
    extra_kwargs: dict[str, Any] | None = None,
) -> Any:
    seed = _to_int(seed, default=profile.default_seed)
    num_steps = _to_int(num_steps, default=profile.default_steps)
    guidance_scale = _to_float(guidance_scale, default=profile.default_guidance)
    height = _to_int(height, default=0)
    width = _to_int(width, default=0)

    if scheduler_name and not uses_native_scheduler(profile):
        swap_scheduler(pipe, str(scheduler_name), profile)

    generator = torch.Generator(device="cuda").manual_seed(seed)
    call_kwargs: dict[str, Any] = {
        "num_inference_steps": build_inference_steps(profile, num_steps),
        "guidance_scale": guidance_scale,
        "generator": generator,
    }
    call_kwargs.update(extra_kwargs if extra_kwargs is not None else profile.extra_call_kwargs)

    call_kwargs["class_labels"] = resolve_class_labels(
        pipe,
        class_label,
        default=profile.default_class_label,
    )

    native = profile.infer_resolution()
    if height > 0 and width > 0:
        if profile.collection != "ADM-diffusers" or height != native or width != native:
            call_kwargs["height"] = height
            call_kwargs["width"] = width

    return pipe(**_filter_call_kwargs(pipe, call_kwargs)).images[0]