diff --git a/train.py b/train.py index 749c5c7..1312b46 100644 --- a/train.py +++ b/train.py @@ -891,7 +891,7 @@ def main(args): train_dataloader = build_torch_dataloader(train_batch, batch_size=args.batch_size) - unet.train() if not args.disable_unet_training else unet.eval() + unet.train() if (args.gradient_checkpointing or not args.disable_unet_training) else unet.eval() text_encoder.train() if not args.disable_textenc_training else text_encoder.eval() logging.info(f" unet device: {unet.device}, precision: {unet.dtype}, training: {unet.training}")