diff --git a/trl/trainer/kto_config.py b/trl/trainer/kto_config.py index 9c357dbdb1..bfafa9a32c 100644 --- a/trl/trainer/kto_config.py +++ b/trl/trainer/kto_config.py @@ -81,7 +81,7 @@ class KTOConfig(TrainingArguments): """ learning_rate: float = field( - default=1e-6, + default=5e-7, metadata={ "help": "Initial learning rate for `AdamW` optimizer. The default value replaces that of " "`transformers.TrainingArguments`."