diff --git a/optimizer_dadapt.json b/optimizer_dadapt.json index 9f45714..f6b57d0 100644 --- a/optimizer_dadapt.json +++ b/optimizer_dadapt.json @@ -46,6 +46,7 @@ "decouple": true }, "text_encoder_freezing": { - "unfreeze_last_n_layers": 6 - } + "unfreeze_last_n_layers": null + }, + "apply_grad_scaler_step_tweaks": true }