From 2f52832209267d904d53b799534549e9f1484aa7 Mon Sep 17 00:00:00 2001 From: Victor Hall Date: Mon, 18 Sep 2023 14:54:43 -0400 Subject: [PATCH] fix trainSD21.json and advanced tweaking ema param names --- doc/ADVANCED_TWEAKING.md | 2 +- trainSD21.json | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/doc/ADVANCED_TWEAKING.md b/doc/ADVANCED_TWEAKING.md index 894a894..310f06e 100644 --- a/doc/ADVANCED_TWEAKING.md +++ b/doc/ADVANCED_TWEAKING.md @@ -230,7 +230,7 @@ In this mode, the EMA model will be saved alongside the regular checkpoint from For more information, consult the [research paper](https://arxiv.org/abs/2101.08482) or continue reading the tuning notes below. **Parameters:** - `--ema_decay_rate`: Determines the EMA decay rate. It defines how much the EMA model is updated from training at each update. Values should be close to 1 but not exceed it. Activating this parameter triggers the EMA decay feature. -- `--ema_decay_target`: Set the EMA decay target value within the (0,1) range. The `ema_decay_rate` is computed based on the relation: decay_rate to the power of (total_steps/decay_interval) equals decay_target. Enabling this parameter will override `ema_decay_rate` and will enable EMA feature. +- `--ema_strength_target`: Set the EMA decay target value within the (0,1) range. The `ema_decay_rate` is computed based on the relation: decay_rate to the power of (total_steps/decay_interval) equals decay_target. Enabling this parameter will override `ema_decay_rate` and will enable EMA feature. - `--ema_update_interval`: Set the interval in steps between EMA updates. The update occurs at each optimizer step. If you use grad_accum, actual update interval will be multipled by your grad_accum value. - `--ema_device`: Choose between `cpu` and `cuda` for EMA. Opting for 'cpu' takes around 4 seconds per update and uses approximately 3.2GB RAM, while 'cuda' is much faster but requires a similar amount of VRAM. - `--ema_sample_raw_training`: Activate to display samples from the trained model, mirroring conventional training. They will not be presented by default with EMA decay enabled. diff --git a/trainSD21.json b/trainSD21.json index 01347ef..da3672c 100644 --- a/trainSD21.json +++ b/trainSD21.json @@ -44,7 +44,7 @@ "load_settings_every_epoch": false, "min_snr_gamma": null, "ema_decay_rate": null, - "ema_decay_target": null, + "ema_strength_target": null, "ema_update_interval": null, "ema_device": null, "ema_sample_raw_training": false,