We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 8e1ee62 commit 7cd0109 (Copy full SHA for 7cd0109)
1 file changed
src/together/resources/finetune.py
@@ -219,6 +219,9 @@ def create_finetune_request(
219
f"Parameter simpo_gamma was set to {simpo_gamma}. "
220
"SimPO training detected. Reference logits will not be used."
221
)
222
+ else:
223
+ dpo_reference_free=None
224
+
225
training_method_cls = TrainingMethodDPO(
226
dpo_beta=dpo_beta,
227
dpo_normalize_logratios_by_length=dpo_normalize_logratios_by_length,
0 commit comments