| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| | |
| |
|
| | import unittest |
| |
|
| | from diffusers import AutoencoderKLTemporalDecoder |
| |
|
| | from ...testing_utils import ( |
| | enable_full_determinism, |
| | floats_tensor, |
| | torch_device, |
| | ) |
| | from ..test_modeling_common import ModelTesterMixin |
| | from .testing_utils import AutoencoderTesterMixin |
| |
|
| |
|
| | enable_full_determinism() |
| |
|
| |
|
| | class AutoencoderKLTemporalDecoderTests(ModelTesterMixin, AutoencoderTesterMixin, unittest.TestCase): |
| | model_class = AutoencoderKLTemporalDecoder |
| | main_input_name = "sample" |
| | base_precision = 1e-2 |
| |
|
| | @property |
| | def dummy_input(self): |
| | batch_size = 3 |
| | num_channels = 3 |
| | sizes = (32, 32) |
| |
|
| | image = floats_tensor((batch_size, num_channels) + sizes).to(torch_device) |
| | num_frames = 3 |
| |
|
| | return {"sample": image, "num_frames": num_frames} |
| |
|
| | @property |
| | def input_shape(self): |
| | return (3, 32, 32) |
| |
|
| | @property |
| | def output_shape(self): |
| | return (3, 32, 32) |
| |
|
| | def prepare_init_args_and_inputs_for_common(self): |
| | init_dict = { |
| | "block_out_channels": [32, 64], |
| | "in_channels": 3, |
| | "out_channels": 3, |
| | "down_block_types": ["DownEncoderBlock2D", "DownEncoderBlock2D"], |
| | "latent_channels": 4, |
| | "layers_per_block": 2, |
| | } |
| | inputs_dict = self.dummy_input |
| | return init_dict, inputs_dict |
| |
|
| | def test_gradient_checkpointing_is_applied(self): |
| | expected_set = {"Encoder", "TemporalDecoder", "UNetMidBlock2D"} |
| | super().test_gradient_checkpointing_is_applied(expected_set=expected_set) |
| |
|