diffusers/tests/test_models_vq.py

# coding=utf-8
# Copyright 2022 HuggingFace Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import unittest

import torch

from diffusers import VQModel
from diffusers.testing_utils import floats_tensor, torch_device

from .test_modeling_common import ModelTesterMixin


# Disable TF32 for CUDA matrix multiplications. This runs at import time and
# changes a torch-wide backend flag, not something scoped to this test class.
# Presumably this keeps outputs close enough to the hard-coded expected slice
# checked with atol=1e-3 below — TODO confirm.
torch.backends.cuda.matmul.allow_tf32 = False


class VQModelTests(ModelTesterMixin, unittest.TestCase):
    """Unit tests for `VQModel`.

    Inherits from `ModelTesterMixin` and adds two tests that load the
    `fusing/vqgan-dummy` checkpoint via `VQModel.from_pretrained`.
    """

    # Model class under test; presumably read by the inherited mixin tests.
    model_class = VQModel

    @property
    def dummy_input(self, sizes=(32, 32)):
        """Build the keyword arguments for a forward pass.

        Args:
            sizes: Trailing dimensions appended to `(batch_size, num_channels)`.
                Because this is a property, plain attribute access always uses
                the default `(32, 32)`.

        Returns:
            A dict with the single key `"sample"`, whose value is the result of
            `floats_tensor((4, 3) + sizes)` moved to `torch_device`.
        """
        batch_size = 4
        num_channels = 3

        image = floats_tensor((batch_size, num_channels) + sizes).to(torch_device)

        return {"sample": image}

    @property
    def input_shape(self):
        """Return `(3, 32, 32)`, i.e. the `dummy_input` shape without the batch dimension."""
        return (3, 32, 32)

    @property
    def output_shape(self):
        """Return `(3, 32, 32)`, the same tuple as `input_shape`."""
        return (3, 32, 32)

    def prepare_init_args_and_inputs_for_common(self):
        """Return the constructor kwargs and forward-pass inputs as a pair.

        Returns:
            A tuple `(init_dict, inputs_dict)`: `init_dict` holds the keyword
            arguments listed below and `inputs_dict` is `self.dummy_input`.
            Presumably consumed by the `ModelTesterMixin` tests — verify there.
        """
        init_dict = {
            "block_out_channels": [32, 64],
            "in_channels": 3,
            "out_channels": 3,
            "down_block_types": ["DownEncoderBlock2D", "DownEncoderBlock2D"],
            "up_block_types": ["UpDecoderBlock2D", "UpDecoderBlock2D"],
            "latent_channels": 3,
        }
        inputs_dict = self.dummy_input
        return init_dict, inputs_dict

    def test_forward_signature(self):
        # No-op: defining the method here replaces any test of the same name
        # inherited from ModelTesterMixin (presumably a deliberate opt-out —
        # TODO confirm the reason).
        pass

    def test_training(self):
        # No-op: defining the method here replaces any test of the same name
        # inherited from ModelTesterMixin (presumably a deliberate opt-out —
        # TODO confirm the reason).
        pass

    def test_from_pretrained_hub(self):
        # Load the dummy checkpoint and require that no keys are reported missing.
        model, loading_info = VQModel.from_pretrained("fusing/vqgan-dummy", output_loading_info=True)
        self.assertIsNotNone(model)
        self.assertEqual(len(loading_info["missing_keys"]), 0)

        # Smoke-test one forward pass with the dummy inputs on the target device.
        model.to(torch_device)
        image = model(**self.dummy_input)

        # Use a unittest assertion rather than a bare `assert`: bare asserts are
        # stripped under `python -O`, and this matches the model check above.
        self.assertIsNotNone(image, "Make sure output is not None")

    def test_output_pretrained(self):
        # Compare a slice of the checkpoint's output against hard-coded values.
        model = VQModel.from_pretrained("fusing/vqgan-dummy")
        model.to(torch_device).eval()

        # Seed the default generator (and every CUDA generator, if present)
        # before drawing the random input.
        torch.manual_seed(0)
        if torch.cuda.is_available():
            torch.cuda.manual_seed_all(0)

        # The input is drawn without a device argument and only then moved to
        # torch_device.
        image = torch.randn(1, model.config.in_channels, model.config.sample_size, model.config.sample_size)
        image = image.to(torch_device)
        with torch.no_grad():
            # Warmup pass when using mps (see #372)
            if torch_device == "mps":
                _ = model(image)
            output = model(image).sample

        # First batch entry, last index along dim 1, trailing 3x3 window of the
        # last two dims; flattened and moved to CPU for the comparison.
        output_slice = output[0, -1, -3:, -3:].flatten().cpu()
        # fmt: off
        expected_output_slice = torch.tensor([-0.0153, -0.4044, -0.1880, -0.5161, -0.2418, -0.4072, -0.1612, -0.0633, -0.0143])
        # fmt: on
        self.assertTrue(torch.allclose(output_slice, expected_output_slice, atol=1e-3))
split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00			`# coding=utf-8`
			`# Copyright 2022 HuggingFace Inc.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`

			`import unittest`

			`import torch`

			`from diffusers import VQModel`
			`from diffusers.testing_utils import floats_tensor, torch_device`

			`from .test_modeling_common import ModelTesterMixin`


[Tests] Make sure tests are on GPU (#269) * [Tests] Make sure tests are on GPU * move more models * speed up tests 2022-08-29 07:58:11 -06:00			`torch.backends.cuda.matmul.allow_tf32 = False`


split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00			`class VQModelTests(ModelTesterMixin, unittest.TestCase):`
			`model_class = VQModel`

			`@property`
			`def dummy_input(self, sizes=(32, 32)):`
			`batch_size = 4`
			`num_channels = 3`

			`image = floats_tensor((batch_size, num_channels) + sizes).to(torch_device)`

			`return {"sample": image}`

			`@property`
			`def input_shape(self):`
			`return (3, 32, 32)`

			`@property`
			`def output_shape(self):`
			`return (3, 32, 32)`

			`def prepare_init_args_and_inputs_for_common(self):`
			`init_dict = {`
			`"block_out_channels": [32, 64],`
			`"in_channels": 3,`
			`"out_channels": 3,`
			`"down_block_types": ["DownEncoderBlock2D", "DownEncoderBlock2D"],`
			`"up_block_types": ["UpDecoderBlock2D", "UpDecoderBlock2D"],`
			`"latent_channels": 3,`
			`}`
			`inputs_dict = self.dummy_input`
			`return init_dict, inputs_dict`

			`def test_forward_signature(self):`
			`pass`

			`def test_training(self):`
			`pass`

			`def test_from_pretrained_hub(self):`
			`model, loading_info = VQModel.from_pretrained("fusing/vqgan-dummy", output_loading_info=True)`
			`self.assertIsNotNone(model)`
			`self.assertEqual(len(loading_info["missing_keys"]), 0)`

			`model.to(torch_device)`
			`image = model(**self.dummy_input)`

			`assert image is not None, "Make sure output is not None"`

			`def test_output_pretrained(self):`
			`model = VQModel.from_pretrained("fusing/vqgan-dummy")`
[Tests] Make sure tests are on GPU (#269) * [Tests] Make sure tests are on GPU * move more models * speed up tests 2022-08-29 07:58:11 -06:00			`model.to(torch_device).eval()`
split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00
			`torch.manual_seed(0)`
			`if torch.cuda.is_available():`
			`torch.cuda.manual_seed_all(0)`

			`image = torch.randn(1, model.config.in_channels, model.config.sample_size, model.config.sample_size)`
[Tests] Make sure tests are on GPU (#269) * [Tests] Make sure tests are on GPU * move more models * speed up tests 2022-08-29 07:58:11 -06:00			`image = image.to(torch_device)`
split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00			`with torch.no_grad():`
Inference support for `mps` device (#355) * Initial support for mps in Stable Diffusion pipeline. * Initial "warmup" implementation when using mps. * Make some deterministic tests pass with mps. * Disable training tests when using mps. * SD: generate latents in CPU then move to device. This is especially important when using the mps device, because generators are not supported there. See for example https://github.com/pytorch/pytorch/issues/84288. In addition, the other pipelines seem to use the same approach: generate the random samples then move to the appropriate device. After this change, generating an image in MPS produces the same result as when using the CPU, if the same seed is used. * Remove prints. * Pass AutoencoderKL test_output_pretrained with mps. Sampling from `posterior` must be done in CPU. * Style * Do not use torch.long for log op in mps device. * Perform incompatible padding ops in CPU. UNet tests now pass. See https://github.com/pytorch/pytorch/issues/84535 * Style: fix import order. * Remove unused symbols. * Remove MPSWarmupMixin, do not apply automatically. We do apply warmup in the tests, but not during normal use. This adopts some PR suggestions by @patrickvonplaten. * Add comment for mps fallback to CPU step. * Add README_mps.md for mps installation and use. * Apply `black` to modified files. * Restrict README_mps to SD, show measures in table. * Make PNDM indexing compatible with mps. Addresses #239. * Do not use float64 when using LDMScheduler. Fixes #358. * Fix typo identified by @patil-suraj Co-authored-by: Suraj Patil <surajp815@gmail.com> * Adapt example to new output style. * Restore 1:1 results reproducibility with CompVis. However, mps latents need to be generated in CPU because generators don't work in the mps device. * Move PyTorch nightly to requirements. * Adapt `test_scheduler_outputs_equivalence` ton MPS. * mps: skip training tests instead of ignoring silently. * Make VQModel tests pass on mps. 
* mps ddim tests: warmup, increase tolerance. * ScoreSdeVeScheduler indexing made mps compatible. * Make ldm pipeline tests pass using warmup. * Style * Simplify casting as suggested in PR. * Add Known Issues to readme. * `isort` import order. * Remove _mps_warmup helpers from ModelMixin. And just make changes to the tests. * Skip tests using unittest decorator for consistency. * Remove temporary var. * Remove spurious blank space. * Remove unused symbol. * Remove README_mps. Co-authored-by: Suraj Patil <surajp815@gmail.com> Co-authored-by: Patrick von Platen <patrick.v.platen@gmail.com> 2022-09-08 05:37:36 -06:00			`# Warmup pass when using mps (see #372)`
			`if torch_device == "mps":`
			`_ = model(image)`
[ModelOutputs] Replace dict outputs with Dict/Dataclass and allow to return tuples (#334) * add outputs for models * add for pipelines * finish schedulers * better naming * adapt tests as well * replace dict access with . access * make schedulers works * finish * correct readme * make bcp compatible * up * small fix * finish * more fixes * more fixes * Apply suggestions from code review Co-authored-by: Suraj Patil <surajp815@gmail.com> Co-authored-by: Pedro Cuenca <pedro@huggingface.co> * Update src/diffusers/models/vae.py Co-authored-by: Pedro Cuenca <pedro@huggingface.co> * Adapt model outputs * Apply more suggestions * finish examples * correct Co-authored-by: Suraj Patil <surajp815@gmail.com> Co-authored-by: Pedro Cuenca <pedro@huggingface.co> 2022-09-05 06:49:26 -06:00			`output = model(image).sample`
split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00
[Tests] Make sure tests are on GPU (#269) * [Tests] Make sure tests are on GPU * move more models * speed up tests 2022-08-29 07:58:11 -06:00			`output_slice = output[0, -1, -3:, -3:].flatten().cpu()`
split tests_modeling_utils (#223) * split tests_modeling_utils * Fix SD tests .to(device) * fix merge * Fix style Co-authored-by: anton-l <anton@huggingface.co> 2022-08-24 05:27:16 -06:00			`# fmt: off`
			`expected_output_slice = torch.tensor([-0.0153, -0.4044, -0.1880, -0.5161, -0.2418, -0.4072, -0.1612, -0.0633, -0.0143])`
			`# fmt: on`
update expected results of slow tests (#268) * update expected results of slow tests * relax sum and mean tests * Print shapes when reporting exception * formatting * fix sentence * relax test_stable_diffusion_fast_ddim for gpu fp16 * relax flakey tests on GPU * added comment on large tolerences * black * format * set scheduler seed * added generator * use np.isclose * set num_inference_steps to 50 * fix dep. warning * update expected_slice * preprocess if image * updated expected results * updated expected from CI * pass generator to VAE * undo change back to orig * use orignal * revert back the expected on cpu * revert back values for CPU * more undo * update result after using gen * update mean * set generator for mps * update expected on CI server * undo * use new seed every time * cpu manual seed * reduce num_inference_steps * style * use generator for randn Co-authored-by: Patrick von Platen <patrick.v.platen@gmail.com> 2022-09-12 07:49:39 -06:00			`self.assertTrue(torch.allclose(output_slice, expected_output_slice, atol=1e-3))`