Skip to content

Commit 5f8b188

Browse files
committed
Force normalization for simpo
1 parent 0719212 commit 5f8b188

1 file changed

Lines changed: 3 additions & 1 deletion

File tree

src/together/resources/finetune.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -215,9 +215,11 @@ def create_finetune_request(
215215
elif training_method == "dpo":
216216
if simpo_gamma is not None and simpo_gamma > 0:
217217
dpo_reference_free = True
218+
dpo_normalize_logratios_by_length = True
218219
rprint(
219220
f"Parameter simpo_gamma was set to {simpo_gamma}. "
220-
"SimPO training detected. Reference logits will not be used."
221+
"SimPO training detected. Reference logits will not be used "
222+
"and length normalization of logps will be enabled."
221223
)
222224
else:
223225
dpo_reference_free = False

0 commit comments

Comments
 (0)