We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 92d7e01 commit 51b96fc (Copy full SHA for 51b96fc)
src/together/resources/finetune.py
@@ -189,7 +189,7 @@ def create_finetune_request(
189
raise ValueError(
190
"dpo_normalize_logratios_by_length=True is only supported for DPO training"
191
)
192
- if rpo_alpha is not None:
+ if rpo_alpha is not None:
193
if training_method != "dpo":
194
raise ValueError("rpo_alpha is only supported for DPO training")
195
if not rpo_alpha >= 0.0:
0 commit comments