2023-02-25 13:05:22 -07:00
{
"doc" : {
"optimizer" : "adamw, adamw8bit, lion" ,
"optimizer_desc" : "'adamw' in standard 32bit, 'adamw8bit' is bitsandbytes, 'lion' is lucidrains" ,
"lr" : "learning rate, if null wil use CLI or main JSON config value" ,
"betas" : "exponential decay rates for the moment estimates" ,
"epsilon" : "value added to denominator for numerical stability, unused for lion" ,
2023-03-01 16:13:43 -07:00
"weight_decay" : "weight decay (L2 penalty)" ,
2023-03-02 14:36:00 -07:00
"text_encoder_lr_scale" : "scale the text encoder LR relative to the Unet LR. for example, if `lr` is 2e-6 and `text_encoder_lr_scale` is 0.5, the text encoder's LR will be set to `1e-6`."
2023-02-25 13:05:22 -07:00
} ,
"optimizer" : "adamw8bit" ,
2023-02-26 17:11:42 -07:00
"lr" : 1e-6 ,
2023-02-25 13:05:22 -07:00
"betas" : [ 0.9 , 0.999 ] ,
"epsilon" : 1e-8 ,
2023-03-01 16:13:43 -07:00
"weight_decay" : 0.010 ,
2023-03-25 18:09:06 -06:00
"text_encoder_lr_scale" : 0.50
2023-02-26 08:00:42 -07:00
}