diffusers/tests/test_modeling_utils.py

# coding=utf-8
# Copyright 2022 HuggingFace Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


import tempfile
import unittest

import torch

from diffusers import DDIM, DDPM, PNDM, DDIMScheduler, DDPMScheduler, LatentDiffusion, PNDMScheduler, UNetModel
from diffusers.configuration_utils import ConfigMixin
from diffusers.pipeline_utils import DiffusionPipeline
from diffusers.testing_utils import floats_tensor, slow, torch_device


# Disable TF32 for CUDA matmuls for the whole test module.
# NOTE(review): presumably this keeps float32 results precise enough for the
# tolerances asserted in the tests below (1e-5 / 1e-2) — confirm.
torch.backends.cuda.matmul.allow_tf32 = False


class ConfigTester(unittest.TestCase):
    """Tests for the config registration and save/load API of ``ConfigMixin``."""

    def test_load_not_from_mixin(self):
        """``ConfigMixin.from_config`` called on the mixin itself raises ``ValueError``."""
        self.assertRaises(ValueError, ConfigMixin.from_config, "dummy_path")

    def test_save_load(self):
        """Register default values, save them, reload them and compare both configs."""

        class SampleObject(ConfigMixin):
            config_name = "config.json"

            # NOTE: ``e`` has a list default; the assertions below check that
            # this list value is registered and compares equal after reloading.
            def __init__(self, a=2, b=5, c=(2, 5), d="for diffusion", e=[1, 3]):
                self.register(a=a, b=b, c=c, d=d, e=e)

        original = SampleObject()
        original_config = original.config

        # Every constructor default must be readable from the registered config.
        expected_defaults = {
            "a": 2,
            "b": 5,
            "c": (2, 5),
            "d": "for diffusion",
            "e": [1, 3],
        }
        for key, value in expected_defaults.items():
            assert original_config[key] == value

        with tempfile.TemporaryDirectory() as save_dir:
            original.save_config(save_dir)
            reloaded = SampleObject.from_config(save_dir)
            reloaded_config = reloaded.config

        # "c" is popped from both configs and checked separately because its
        # container type differs between the two; the remainder must be equal.
        assert original_config.pop("c") == (2, 5)  # instantiated as tuple
        assert reloaded_config.pop("c") == [2, 5]  # saved & loaded as list because of json
        assert original_config == reloaded_config


class ModelTesterMixin(unittest.TestCase):
    """Save/load and forward-pass tests for ``UNetModel``."""

    @property
    def dummy_input(self):
        """Return the ``(noise, time_step)`` pair passed to the model in these tests.

        ``noise`` is requested from ``floats_tensor`` with shape ``(4, 3, 32, 32)``
        and ``time_step`` is a one-element tensor holding ``10``; both are moved
        to ``torch_device``.
        """
        shape = (4, 3, 32, 32)  # (batch_size, num_channels) + sizes

        noise = floats_tensor(shape).to(torch_device)
        time_step = torch.tensor([10]).to(torch_device)

        return noise, time_step

    def test_from_pretrained_save_pretrained(self):
        """A model saved to disk and reloaded must give the same forward output."""
        original = UNetModel(ch=32, ch_mult=(1, 2), num_res_blocks=2, attn_resolutions=(16,), resolution=32)
        original.to(torch_device)

        with tempfile.TemporaryDirectory() as save_dir:
            original.save_pretrained(save_dir)
            reloaded = UNetModel.from_pretrained(save_dir)
            reloaded.to(torch_device)

        # Feed the very same tensors to both models.
        noise, time_step = self.dummy_input

        output = original(noise, time_step)
        reloaded_output = reloaded(noise, time_step)

        total_abs_diff = (output - reloaded_output).abs().sum()
        assert total_abs_diff < 1e-5, "Models don't give the same forward pass"

    def test_from_pretrained_hub(self):
        """The ``fusing/ddpm_dummy`` checkpoint loads and produces a non-``None`` output."""
        hub_model = UNetModel.from_pretrained("fusing/ddpm_dummy")
        hub_model.to(torch_device)

        noise, time_step = self.dummy_input
        output = hub_model(noise, time_step)

        assert output is not None, "Make sure output is not None"


class PipelineTesterMixin(unittest.TestCase):
    """Save/load tests and sampling regression tests for the diffusion pipelines."""

    def _assert_image_slice_close(self, image, expected_shape, expected_values, tol=1e-2):
        """Check the shape of ``image`` and compare a trailing 3x3 window to reference values.

        Args:
            image: Tensor returned by a pipeline call.
            expected_shape: Tuple that ``image.shape`` must equal.
            expected_values: Nine reference floats compared against the flattened
                ``image[0, -1, -3:, -3:]`` window.
            tol: Upper bound (exclusive) for the largest absolute difference.

        Raises:
            AssertionError: If the shape differs or any value is off by ``tol`` or more.
        """
        # Slice first, then check the shape: same evaluation order as the
        # assertions this helper replaces.
        image_slice = image[0, -1, -3:, -3:].cpu()

        assert image.shape == expected_shape
        expected_slice = torch.tensor(expected_values)
        assert (image_slice.flatten() - expected_slice).abs().max() < tol

    def test_from_pretrained_save_pretrained(self):
        """A DDPM pipeline saved to disk and reloaded must sample the same image."""
        # 1. Build the pipeline from a small model and a 10-step scheduler
        model = UNetModel(ch=32, ch_mult=(1, 2), num_res_blocks=2, attn_resolutions=(16,), resolution=32)
        scheduler = DDPMScheduler(timesteps=10)

        ddpm = DDPM(model, scheduler)

        # 2. Round-trip the pipeline through a temporary directory
        with tempfile.TemporaryDirectory() as tmpdirname:
            ddpm.save_pretrained(tmpdirname)
            new_ddpm = DDPM.from_pretrained(tmpdirname)

        # 3. Sample from both pipelines, re-seeding the generator in between
        generator = torch.manual_seed(0)

        image = ddpm(generator=generator)
        generator = generator.manual_seed(0)
        new_image = new_ddpm(generator=generator)

        assert (image - new_image).abs().sum() < 1e-5, "Models don't give the same forward pass"

    @slow
    def test_from_pretrained_hub(self):
        """``DDPM.from_pretrained`` and ``DiffusionPipeline.from_pretrained`` must sample the same image."""
        model_path = "fusing/ddpm-cifar10"

        ddpm = DDPM.from_pretrained(model_path)
        ddpm_from_hub = DiffusionPipeline.from_pretrained(model_path)

        # Set both schedulers to 10 timesteps before sampling.
        ddpm.noise_scheduler.num_timesteps = 10
        ddpm_from_hub.noise_scheduler.num_timesteps = 10

        generator = torch.manual_seed(0)

        image = ddpm(generator=generator)
        generator = generator.manual_seed(0)
        new_image = ddpm_from_hub(generator=generator)

        assert (image - new_image).abs().sum() < 1e-5, "Models don't give the same forward pass"

    @slow
    def test_ddpm_cifar10(self):
        """Regression test: DDPM sampling with the ``fusing/ddpm-cifar10`` weights."""
        generator = torch.manual_seed(0)
        model_id = "fusing/ddpm-cifar10"

        unet = UNetModel.from_pretrained(model_id)
        noise_scheduler = DDPMScheduler.from_config(model_id)
        noise_scheduler = noise_scheduler.set_format("pt")

        ddpm = DDPM(unet=unet, noise_scheduler=noise_scheduler)
        image = ddpm(generator=generator)

        self._assert_image_slice_close(
            image,
            (1, 3, 32, 32),
            [0.2250, 0.3375, 0.2360, 0.0930, 0.3440, 0.3156, 0.1937, 0.3585, 0.1761],
        )

    @slow
    def test_ddim_cifar10(self):
        """Regression test: DDIM sampling (``eta=0.0``) with the ``fusing/ddpm-cifar10`` weights."""
        generator = torch.manual_seed(0)
        model_id = "fusing/ddpm-cifar10"

        unet = UNetModel.from_pretrained(model_id)
        noise_scheduler = DDIMScheduler(tensor_format="pt")

        ddim = DDIM(unet=unet, noise_scheduler=noise_scheduler)
        image = ddim(generator=generator, eta=0.0)

        self._assert_image_slice_close(
            image,
            (1, 3, 32, 32),
            [-0.7383, -0.7385, -0.7298, -0.7364, -0.7414, -0.7239, -0.6737, -0.6813, -0.7068],
        )

    @slow
    def test_pndm_cifar10(self):
        """Regression test: PNDM sampling with the ``fusing/ddpm-cifar10`` weights."""
        generator = torch.manual_seed(0)
        model_id = "fusing/ddpm-cifar10"

        unet = UNetModel.from_pretrained(model_id)
        noise_scheduler = PNDMScheduler(tensor_format="pt")

        pndm = PNDM(unet=unet, noise_scheduler=noise_scheduler)
        image = pndm(generator=generator)

        self._assert_image_slice_close(
            image,
            (1, 3, 32, 32),
            [-0.7888, -0.7870, -0.7759, -0.7823, -0.8014, -0.7608, -0.6818, -0.7130, -0.7471],
        )

    @slow
    def test_ldm_text2img(self):
        """Regression test: text-to-image sampling with ``fusing/latent-diffusion-text2im-large``."""
        model_id = "fusing/latent-diffusion-text2im-large"
        ldm = LatentDiffusion.from_pretrained(model_id)

        prompt = "A painting of a squirrel eating a burger"
        generator = torch.manual_seed(0)
        image = ldm([prompt], generator=generator, num_inference_steps=20)

        self._assert_image_slice_close(
            image,
            (1, 3, 256, 256),
            [0.7295, 0.7358, 0.7256, 0.7435, 0.7095, 0.6884, 0.7325, 0.6921, 0.6458],
        )
add first template for DDPM forward 2022-05-31 06:27:59 -06:00			`# coding=utf-8`
			`# Copyright 2022 HuggingFace Inc.`
			`#`
			`# Licensed under the Apache License, Version 2.0 (the "License");`
			`# you may not use this file except in compliance with the License.`
			`# You may obtain a copy of the License at`
			`#`
			`# http://www.apache.org/licenses/LICENSE-2.0`
			`#`
			`# Unless required by applicable law or agreed to in writing, software`
			`# distributed under the License is distributed on an "AS IS" BASIS,`
			`# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`# See the License for the specific language governing permissions and`
			`# limitations under the License.`

fix random seed 2022-06-07 10:20:14 -06:00
add first template for DDPM forward 2022-05-31 06:27:59 -06:00			`import tempfile`
			`import unittest`

			`import torch`

Move the training example 2022-06-14 03:33:24 -06:00			`from diffusers import DDIM, DDPM, PNDM, DDIMScheduler, DDPMScheduler, LatentDiffusion, PNDMScheduler, UNetModel`
finish transformers removal 2022-06-09 04:36:37 -06:00			`from diffusers.configuration_utils import ConfigMixin`
fix setup 2022-06-09 06:06:58 -06:00			`from diffusers.pipeline_utils import DiffusionPipeline`
finish refactor 2022-06-12 15:20:39 -06:00			`from diffusers.testing_utils import floats_tensor, slow, torch_device`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00

make tests pass 2022-06-12 11:59:39 -06:00			`torch.backends.cuda.matmul.allow_tf32 = False`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00

finish transformers removal 2022-06-09 04:36:37 -06:00			`class ConfigTester(unittest.TestCase):`
			`def test_load_not_from_mixin(self):`
			`with self.assertRaises(ValueError):`
			`ConfigMixin.from_config("dummy_path")`

			`def test_save_load(self):`
			`class SampleObject(ConfigMixin):`
			`config_name = "config.json"`

			`def __init__(`
			`self,`
			`a=2,`
			`b=5,`
			`c=(2, 5),`
			`d="for diffusion",`
			`e=[1, 3],`
			`):`
			`self.register(a=a, b=b, c=c, d=d, e=e)`

			`obj = SampleObject()`
			`config = obj.config`

			`assert config["a"] == 2`
			`assert config["b"] == 5`
			`assert config["c"] == (2, 5)`
			`assert config["d"] == "for diffusion"`
			`assert config["e"] == [1, 3]`

			`with tempfile.TemporaryDirectory() as tmpdirname:`
			`obj.save_config(tmpdirname)`
			`new_obj = SampleObject.from_config(tmpdirname)`
			`new_config = new_obj.config`

			`assert config.pop("c") == (2, 5) # instantiated as tuple`
			`assert new_config.pop("c") == [2, 5] # saved & loaded as list because of json`
			`assert config == new_config`


add first template for DDPM forward 2022-05-31 06:27:59 -06:00			`class ModelTesterMixin(unittest.TestCase):`
add another test 2022-05-31 06:46:20 -06:00			`@property`
			`def dummy_input(self):`
up 2022-06-07 07:03:53 -06:00			`batch_size = 4`
add another test 2022-05-31 06:46:20 -06:00			`num_channels = 3`
			`sizes = (32, 32)`

make tests pass 2022-06-12 11:59:39 -06:00			`noise = floats_tensor((batch_size, num_channels) + sizes).to(torch_device)`
add more tests schedulers 2022-06-12 13:56:13 -06:00			`time_step = torch.tensor([10]).to(torch_device)`
add another test 2022-05-31 06:46:20 -06:00
			`return (noise, time_step)`

add first template for DDPM forward 2022-05-31 06:27:59 -06:00			`def test_from_pretrained_save_pretrained(self):`
improve 2022-06-06 09:03:41 -06:00			`model = UNetModel(ch=32, ch_mult=(1, 2), num_res_blocks=2, attn_resolutions=(16,), resolution=32)`
add more tests schedulers 2022-06-12 13:56:13 -06:00			`model.to(torch_device)`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00
			`with tempfile.TemporaryDirectory() as tmpdirname:`
			`model.save_pretrained(tmpdirname)`
			`new_model = UNetModel.from_pretrained(tmpdirname)`
add more tests schedulers 2022-06-12 13:56:13 -06:00			`new_model.to(torch_device)`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00
add another test 2022-05-31 06:46:20 -06:00			`dummy_input = self.dummy_input`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00
add another test 2022-05-31 06:46:20 -06:00			`image = model(*dummy_input)`
			`new_image = new_model(*dummy_input)`
add first template for DDPM forward 2022-05-31 06:27:59 -06:00
			`assert (image - new_image).abs().sum() < 1e-5, "Models don't give the same forward pass"`
add another test 2022-05-31 06:46:20 -06:00
			`def test_from_pretrained_hub(self):`
			`model = UNetModel.from_pretrained("fusing/ddpm_dummy")`
add more tests schedulers 2022-06-12 13:56:13 -06:00			`model.to(torch_device)`
add another test 2022-05-31 06:46:20 -06:00
			`image = model(*self.dummy_input)`

			`assert image is not None, "Make sure output is not None"`
add pretrained model and pretrained sampler 2022-06-01 16:25:48 -06:00

fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00			`class PipelineTesterMixin(unittest.TestCase):`
			`def test_from_pretrained_save_pretrained(self):`
			`# 1. Load models`
			`model = UNetModel(ch=32, ch_mult=(1, 2), num_res_blocks=2, attn_resolutions=(16,), resolution=32)`
rename schedulers 2022-06-13 02:39:53 -06:00			`schedular = DDPMScheduler(timesteps=10)`
fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00
			`ddpm = DDPM(model, schedular)`

			`with tempfile.TemporaryDirectory() as tmpdirname:`
			`ddpm.save_pretrained(tmpdirname)`
			`new_ddpm = DDPM.from_pretrained(tmpdirname)`
fix random seed 2022-06-07 10:20:14 -06:00
			`generator = torch.manual_seed(0)`
fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00
fix tests 2022-06-07 07:43:08 -06:00			`image = ddpm(generator=generator)`
fix random seed 2022-06-07 10:20:14 -06:00			`generator = generator.manual_seed(0)`
fix tests 2022-06-07 07:43:08 -06:00			`new_image = new_ddpm(generator=generator)`
fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00
			`assert (image - new_image).abs().sum() < 1e-5, "Models don't give the same forward pass"`

			`@slow`
			`def test_from_pretrained_hub(self):`
			`model_path = "fusing/ddpm-cifar10"`

			`ddpm = DDPM.from_pretrained(model_path)`
			`ddpm_from_hub = DiffusionPipeline.from_pretrained(model_path)`

			`ddpm.noise_scheduler.num_timesteps = 10`
			`ddpm_from_hub.noise_scheduler.num_timesteps = 10`

fix random seed 2022-06-07 10:20:14 -06:00			`generator = torch.manual_seed(0)`
fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00
fix tests 2022-06-07 07:43:08 -06:00			`image = ddpm(generator=generator)`
fix random seed 2022-06-07 10:20:14 -06:00			`generator = generator.manual_seed(0)`
fix tests 2022-06-07 07:43:08 -06:00			`new_image = ddpm_from_hub(generator=generator)`
fix issues with loading, add test for pipeline 2022-06-07 07:39:47 -06:00
			`assert (image - new_image).abs().sum() < 1e-5, "Models don't give the same forward pass"`
add first version of ddim 2022-06-08 03:42:31 -06:00
			`@slow`
			`def test_ddpm_cifar10(self):`
			`generator = torch.manual_seed(0)`
			`model_id = "fusing/ddpm-cifar10"`

save intermediate 2022-06-10 05:12:23 -06:00			`unet = UNetModel.from_pretrained(model_id)`
rename schedulers 2022-06-13 02:39:53 -06:00			`noise_scheduler = DDPMScheduler.from_config(model_id)`
finish refactor 2022-06-12 15:20:39 -06:00			`noise_scheduler = noise_scheduler.set_format("pt")`
save intermediate 2022-06-10 05:12:23 -06:00
			`ddpm = DDPM(unet=unet, noise_scheduler=noise_scheduler)`
add first version of ddim 2022-06-08 03:42:31 -06:00			`image = ddpm(generator=generator)`

			`image_slice = image[0, -1, -3:, -3:].cpu()`

			`assert image.shape == (1, 3, 32, 32)`
			`expected_slice = torch.tensor([0.2250, 0.3375, 0.2360, 0.0930, 0.3440, 0.3156, 0.1937, 0.3585, 0.1761])`
			`assert (image_slice.flatten() - expected_slice).abs().max() < 1e-2`

			`@slow`
			`def test_ddim_cifar10(self):`
			`generator = torch.manual_seed(0)`
			`model_id = "fusing/ddpm-cifar10"`

save intermediate 2022-06-10 05:12:23 -06:00			`unet = UNetModel.from_pretrained(model_id)`
finish refactor 2022-06-12 15:20:39 -06:00			`noise_scheduler = DDIMScheduler(tensor_format="pt")`
save intermediate 2022-06-10 05:12:23 -06:00
			`ddim = DDIM(unet=unet, noise_scheduler=noise_scheduler)`
add first version of ddim 2022-06-08 03:42:31 -06:00			`image = ddim(generator=generator, eta=0.0)`

			`image_slice = image[0, -1, -3:, -3:].cpu()`

			`assert image.shape == (1, 3, 32, 32)`
fix setup 2022-06-09 06:06:58 -06:00			`expected_slice = torch.tensor(`
			`[-0.7383, -0.7385, -0.7298, -0.7364, -0.7414, -0.7239, -0.6737, -0.6813, -0.7068]`
			`)`
add first version of ddim 2022-06-08 03:42:31 -06:00			`assert (image_slice.flatten() - expected_slice).abs().max() < 1e-2`
add test for ldm 2022-06-10 10:37:45 -06:00
improve pndm 2022-06-13 10:29:22 -06:00			`@slow`
			`def test_pndm_cifar10(self):`
			`generator = torch.manual_seed(0)`
			`model_id = "fusing/ddpm-cifar10"`

			`unet = UNetModel.from_pretrained(model_id)`
			`noise_scheduler = PNDMScheduler(tensor_format="pt")`

			`pndm = PNDM(unet=unet, noise_scheduler=noise_scheduler)`
			`image = pndm(generator=generator)`

			`image_slice = image[0, -1, -3:, -3:].cpu()`

			`assert image.shape == (1, 3, 32, 32)`
			`expected_slice = torch.tensor(`
			`[-0.7888, -0.7870, -0.7759, -0.7823, -0.8014, -0.7608, -0.6818, -0.7130, -0.7471]`
			`)`
			`assert (image_slice.flatten() - expected_slice).abs().max() < 1e-2`

add test for ldm 2022-06-10 10:37:45 -06:00			`@slow`
			`def test_ldm_text2img(self):`
			`model_id = "fusing/latent-diffusion-text2im-large"`
			`ldm = LatentDiffusion.from_pretrained(model_id)`

			`prompt = "A painting of a squirrel eating a burger"`
			`generator = torch.manual_seed(0)`
			`image = ldm([prompt], generator=generator, num_inference_steps=20)`

			`image_slice = image[0, -1, -3:, -3:].cpu()`
			`print(image_slice.shape)`

			`assert image.shape == (1, 3, 256, 256)`
			`expected_slice = torch.tensor([0.7295, 0.7358, 0.7256, 0.7435, 0.7095, 0.6884, 0.7325, 0.6921, 0.6458])`
update 2022-06-12 11:12:01 -06:00			`assert (image_slice.flatten() - expected_slice).abs().max() < 1e-2`