| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
| |
|
|
| import gc |
| import random |
| import unittest |
|
|
| import torch |
|
|
| from diffusers import IFImg2ImgPipeline |
| from diffusers.models.attention_processor import AttnAddedKVProcessor |
| from diffusers.utils.import_utils import is_xformers_available |
|
|
| from ...testing_utils import ( |
| backend_empty_cache, |
| backend_max_memory_allocated, |
| backend_reset_max_memory_allocated, |
| backend_reset_peak_memory_stats, |
| floats_tensor, |
| load_numpy, |
| require_accelerator, |
| require_hf_hub_version_greater, |
| require_torch_accelerator, |
| require_transformers_version_greater, |
| skip_mps, |
| slow, |
| torch_device, |
| ) |
| from ..pipeline_params import ( |
| TEXT_GUIDED_IMAGE_VARIATION_BATCH_PARAMS, |
| TEXT_GUIDED_IMAGE_VARIATION_PARAMS, |
| ) |
| from ..test_pipelines_common import PipelineTesterMixin, assert_mean_pixel_difference |
| from . import IFPipelineTesterMixin |
|
|
|
|
| @skip_mps |
| class IFImg2ImgPipelineFastTests(PipelineTesterMixin, IFPipelineTesterMixin, unittest.TestCase): |
| pipeline_class = IFImg2ImgPipeline |
| params = TEXT_GUIDED_IMAGE_VARIATION_PARAMS - {"width", "height"} |
| batch_params = TEXT_GUIDED_IMAGE_VARIATION_BATCH_PARAMS |
| required_optional_params = PipelineTesterMixin.required_optional_params - {"latents"} |
|
|
| def get_dummy_components(self): |
| return self._get_dummy_components() |
|
|
| def get_dummy_inputs(self, device, seed=0): |
| if str(device).startswith("mps"): |
| generator = torch.manual_seed(seed) |
| else: |
| generator = torch.Generator(device=device).manual_seed(seed) |
|
|
| image = floats_tensor((1, 3, 32, 32), rng=random.Random(seed)).to(device) |
|
|
| inputs = { |
| "prompt": "A painting of a squirrel eating a burger", |
| "image": image, |
| "generator": generator, |
| "num_inference_steps": 2, |
| "output_type": "np", |
| } |
|
|
| return inputs |
|
|
| @unittest.skipIf( |
| torch_device != "cuda" or not is_xformers_available(), |
| reason="XFormers attention is only available with CUDA and `xformers` installed", |
| ) |
| def test_xformers_attention_forwardGenerator_pass(self): |
| self._test_xformers_attention_forwardGenerator_pass(expected_max_diff=1e-3) |
|
|
| @unittest.skipIf(torch_device not in ["cuda", "xpu"], reason="float16 requires CUDA or XPU") |
| @require_accelerator |
| def test_save_load_float16(self): |
| |
| super().test_save_load_float16(expected_max_diff=1e-1) |
|
|
| @unittest.skipIf(torch_device not in ["cuda", "xpu"], reason="float16 requires CUDA or XPU") |
| @require_accelerator |
| def test_float16_inference(self): |
| super().test_float16_inference(expected_max_diff=1e-1) |
|
|
| def test_attention_slicing_forward_pass(self): |
| self._test_attention_slicing_forward_pass(expected_max_diff=1e-2) |
|
|
| def test_save_load_local(self): |
| self._test_save_load_local() |
|
|
| def test_inference_batch_single_identical(self): |
| self._test_inference_batch_single_identical( |
| expected_max_diff=1e-2, |
| ) |
|
|
| @require_hf_hub_version_greater("0.26.5") |
| @require_transformers_version_greater("4.47.1") |
| def test_save_load_dduf(self): |
| super().test_save_load_dduf(atol=1e-2, rtol=1e-2) |
|
|
| @unittest.skip("Functionality is tested elsewhere.") |
| def test_save_load_optional_components(self): |
| pass |
|
|
|
|
| @slow |
| @require_torch_accelerator |
| class IFImg2ImgPipelineSlowTests(unittest.TestCase): |
| def setUp(self): |
| |
| super().setUp() |
| gc.collect() |
| backend_empty_cache(torch_device) |
|
|
| def tearDown(self): |
| |
| super().tearDown() |
| gc.collect() |
| backend_empty_cache(torch_device) |
|
|
| def test_if_img2img(self): |
| pipe = IFImg2ImgPipeline.from_pretrained( |
| "DeepFloyd/IF-I-L-v1.0", |
| variant="fp16", |
| torch_dtype=torch.float16, |
| ) |
| pipe.unet.set_attn_processor(AttnAddedKVProcessor()) |
| pipe.enable_model_cpu_offload(device=torch_device) |
|
|
| backend_reset_max_memory_allocated(torch_device) |
| backend_empty_cache(torch_device) |
| backend_reset_peak_memory_stats(torch_device) |
|
|
| image = floats_tensor((1, 3, 64, 64), rng=random.Random(0)).to(torch_device) |
| generator = torch.Generator(device="cpu").manual_seed(0) |
| output = pipe( |
| prompt="anime turtle", |
| image=image, |
| num_inference_steps=2, |
| generator=generator, |
| output_type="np", |
| ) |
| image = output.images[0] |
|
|
| mem_bytes = backend_max_memory_allocated(torch_device) |
| assert mem_bytes < 12 * 10**9 |
|
|
| expected_image = load_numpy( |
| "https://huggingface.co/datasets/hf-internal-testing/diffusers-images/resolve/main/if/test_if_img2img.npy" |
| ) |
| assert_mean_pixel_difference(image, expected_image) |
|
|
| pipe.remove_all_hooks() |
|
|